) responseMap.get("error");
+ if (error != null) {
+ var message = (String) error.get("message");
+ if (message != null) {
+ return new AzureAndOpenAiErrorResponseEntity(message);
+ }
+ }
+ } catch (Exception e) {
+ // swallow the error
+ }
+
+ return null;
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiExternalResponseHandler.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiExternalResponseHandler.java
new file mode 100644
index 0000000000000..5f803ad6fe74e
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiExternalResponseHandler.java
@@ -0,0 +1,149 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response;
+
+import org.apache.logging.log4j.Logger;
+import org.elasticsearch.common.Strings;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.http.retry.BaseResponseHandler;
+import org.elasticsearch.xpack.inference.external.http.retry.ContentTooLargeException;
+import org.elasticsearch.xpack.inference.external.http.retry.ErrorMessage;
+import org.elasticsearch.xpack.inference.external.http.retry.ResponseParser;
+import org.elasticsearch.xpack.inference.external.http.retry.RetryException;
+import org.elasticsearch.xpack.inference.external.request.Request;
+import org.elasticsearch.xpack.inference.logging.ThrottlerManager;
+
+import java.util.function.Function;
+
+import static org.elasticsearch.xpack.inference.external.http.HttpUtils.checkForEmptyBody;
+import static org.elasticsearch.xpack.inference.external.http.retry.ResponseHandlerUtils.getFirstHeaderOrUnknown;
+
+/**
+ * A base class to use for external response handling.
+ *
+ * This currently covers response handling for Azure AI Studio, however this pattern
+ * can be used to simplify and refactor handling for Azure OpenAI and OpenAI responses.
+ */
+public class AzureAndOpenAiExternalResponseHandler extends BaseResponseHandler {
+
+ // The maximum number of requests that are permitted before exhausting the rate limit.
+ static final String REQUESTS_LIMIT = "x-ratelimit-limit-requests";
+ // The maximum number of tokens that are permitted before exhausting the rate limit.
+ static final String TOKENS_LIMIT = "x-ratelimit-limit-tokens";
+ // The remaining number of requests that are permitted before exhausting the rate limit.
+ static final String REMAINING_REQUESTS = "x-ratelimit-remaining-requests";
+ // The remaining number of tokens that are permitted before exhausting the rate limit.
+ static final String REMAINING_TOKENS = "x-ratelimit-remaining-tokens";
+
+ static final String CONTENT_TOO_LARGE_MESSAGE = "Please reduce your prompt; or completion length.";
+ static final String SERVER_BUSY_ERROR = "Received a server busy error status code";
+
+ public AzureAndOpenAiExternalResponseHandler(
+ String requestType,
+ ResponseParser parseFunction,
+ Function<HttpResult, ErrorMessage> errorParseFunction
+ ) {
+ super(requestType, parseFunction, errorParseFunction);
+ }
+
+ @Override
+ public void validateResponse(ThrottlerManager throttlerManager, Logger logger, Request request, HttpResult result)
+ throws RetryException {
+ checkForFailureStatusCode(request, result);
+ checkForEmptyBody(throttlerManager, logger, request, result);
+ }
+
+ public void checkForFailureStatusCode(Request request, HttpResult result) throws RetryException {
+ int statusCode = result.response().getStatusLine().getStatusCode();
+ if (statusCode >= 200 && statusCode < 300) {
+ return;
+ }
+
+ // handle error codes
+ if (statusCode == 500) {
+ throw handle500Error(request, result);
+ } else if (statusCode == 503) {
+ throw handle503Error(request, result);
+ } else if (statusCode > 500) {
+ throw handleOther500Error(request, result);
+ } else if (statusCode == 429) {
+ throw handleRateLimitingError(request, result);
+ } else if (isContentTooLarge(result)) {
+ throw new ContentTooLargeException(buildError(CONTENT_TOO_LARGE, request, result));
+ } else if (statusCode == 401) {
+ throw handleAuthenticationError(request, result);
+ } else if (statusCode >= 300 && statusCode < 400) {
+ throw handleRedirectionStatusCode(request, result);
+ } else {
+ throw new RetryException(false, buildError(UNSUCCESSFUL, request, result));
+ }
+ }
+
+ protected RetryException handle500Error(Request request, HttpResult result) {
+ return new RetryException(true, buildError(SERVER_ERROR, request, result));
+ }
+
+ protected RetryException handle503Error(Request request, HttpResult result) {
+ return new RetryException(true, buildError(SERVER_BUSY_ERROR, request, result));
+ }
+
+ protected RetryException handleOther500Error(Request request, HttpResult result) {
+ return new RetryException(false, buildError(SERVER_ERROR, request, result));
+ }
+
+ protected RetryException handleAuthenticationError(Request request, HttpResult result) {
+ return new RetryException(false, buildError(AUTHENTICATION, request, result));
+ }
+
+ protected RetryException handleRateLimitingError(Request request, HttpResult result) {
+ return new RetryException(true, buildError(buildRateLimitErrorMessage(result), request, result));
+ }
+
+ protected RetryException handleRedirectionStatusCode(Request request, HttpResult result) {
+ throw new RetryException(false, buildError(REDIRECTION, request, result));
+ }
+
+ public static boolean isContentTooLarge(HttpResult result) {
+ int statusCode = result.response().getStatusLine().getStatusCode();
+
+ if (statusCode == 413) {
+ return true;
+ }
+
+ if (statusCode == 400) {
+ var errorEntity = AzureAndOpenAiErrorResponseEntity.fromResponse(result);
+ return errorEntity != null && errorEntity.getErrorMessage().contains(CONTENT_TOO_LARGE_MESSAGE);
+ }
+
+ return false;
+ }
+
+ public static String buildRateLimitErrorMessage(HttpResult result) {
+ var response = result.response();
+ var tokenLimit = getFirstHeaderOrUnknown(response, TOKENS_LIMIT);
+ var remainingTokens = getFirstHeaderOrUnknown(response, REMAINING_TOKENS);
+ var requestLimit = getFirstHeaderOrUnknown(response, REQUESTS_LIMIT);
+ var remainingRequests = getFirstHeaderOrUnknown(response, REMAINING_REQUESTS);
+
+ if (tokenLimit.equals("unknown") && requestLimit.equals("unknown")) {
+ var usageMessage = Strings.format("Remaining tokens [%s]. Remaining requests [%s].", remainingTokens, remainingRequests);
+ return RATE_LIMIT + ". " + usageMessage;
+ }
+
+ var usageMessage = Strings.format(
+ "Token limit [%s], remaining tokens [%s]. Request limit [%s], remaining requests [%s]",
+ tokenLimit,
+ remainingTokens,
+ requestLimit,
+ remainingRequests
+ );
+
+ return RATE_LIMIT + ". " + usageMessage;
+ }
+
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/BaseResponseEntity.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/BaseResponseEntity.java
new file mode 100644
index 0000000000000..7c3c7a9645cf3
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/BaseResponseEntity.java
@@ -0,0 +1,27 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response;
+
+import org.elasticsearch.inference.InferenceServiceResults;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.http.retry.ResponseParser;
+import org.elasticsearch.xpack.inference.external.request.Request;
+
+import java.io.IOException;
+
+/**
+ * A base class for providing InferenceServiceResults from a response. This is a lightweight wrapper
+ * to be able to override the `fromResponse` method to avoid using a static reference to the method.
+ */
+public abstract class BaseResponseEntity implements ResponseParser {
+ protected abstract InferenceServiceResults fromResponse(Request request, HttpResult response) throws IOException;
+
+ public InferenceServiceResults apply(Request request, HttpResult response) throws IOException {
+ return fromResponse(request, response);
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioChatCompletionResponseEntity.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioChatCompletionResponseEntity.java
new file mode 100644
index 0000000000000..18f5923353960
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioChatCompletionResponseEntity.java
@@ -0,0 +1,76 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response.azureaistudio;
+
+import org.elasticsearch.common.xcontent.LoggingDeprecationHandler;
+import org.elasticsearch.common.xcontent.XContentParserUtils;
+import org.elasticsearch.inference.InferenceServiceResults;
+import org.elasticsearch.xcontent.XContentFactory;
+import org.elasticsearch.xcontent.XContentParser;
+import org.elasticsearch.xcontent.XContentParserConfiguration;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.core.inference.results.ChatCompletionResults;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.request.Request;
+import org.elasticsearch.xpack.inference.external.request.azureaistudio.AzureAiStudioChatCompletionRequest;
+import org.elasticsearch.xpack.inference.external.response.BaseResponseEntity;
+import org.elasticsearch.xpack.inference.external.response.openai.OpenAiChatCompletionResponseEntity;
+
+import java.io.IOException;
+import java.util.List;
+
+import static org.elasticsearch.common.xcontent.XContentParserUtils.ensureExpectedToken;
+import static org.elasticsearch.xpack.inference.external.response.XContentUtils.moveToFirstToken;
+
+public class AzureAiStudioChatCompletionResponseEntity extends BaseResponseEntity {
+
+ @Override
+ protected InferenceServiceResults fromResponse(Request request, HttpResult response) throws IOException {
+ if (request instanceof AzureAiStudioChatCompletionRequest asChatCompletionRequest) {
+ if (asChatCompletionRequest.isRealtimeEndpoint()) {
+ return parseRealtimeEndpointResponse(response);
+ }
+
+ // we can use the OpenAI chat completion type if it's not a realtime endpoint
+ return OpenAiChatCompletionResponseEntity.fromResponse(request, response);
+ }
+
+ return null;
+ }
+
+ private ChatCompletionResults parseRealtimeEndpointResponse(HttpResult response) throws IOException {
+ var parserConfig = XContentParserConfiguration.EMPTY.withDeprecationHandler(LoggingDeprecationHandler.INSTANCE);
+ try (XContentParser jsonParser = XContentFactory.xContent(XContentType.JSON).createParser(parserConfig, response.body())) {
+ moveToFirstToken(jsonParser);
+
+ XContentParser.Token token = jsonParser.currentToken();
+ XContentParserUtils.ensureExpectedToken(XContentParser.Token.START_OBJECT, token, jsonParser);
+
+ while (token != null && token != XContentParser.Token.END_OBJECT) {
+ if (token != XContentParser.Token.FIELD_NAME) {
+ token = jsonParser.nextToken();
+ continue;
+ }
+
+ var currentName = jsonParser.currentName();
+ if (currentName == null || currentName.equalsIgnoreCase("output") == false) {
+ token = jsonParser.nextToken();
+ continue;
+ }
+
+ token = jsonParser.nextToken();
+ ensureExpectedToken(XContentParser.Token.VALUE_STRING, token, jsonParser);
+ String content = jsonParser.text();
+
+ return new ChatCompletionResults(List.of(new ChatCompletionResults.Result(content)));
+ }
+
+ throw new IllegalStateException("Reached an invalid state while parsing the Azure AI Studio completion response");
+ }
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioEmbeddingsResponseEntity.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioEmbeddingsResponseEntity.java
new file mode 100644
index 0000000000000..3fce1ec7920f5
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioEmbeddingsResponseEntity.java
@@ -0,0 +1,24 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response.azureaistudio;
+
+import org.elasticsearch.inference.InferenceServiceResults;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.request.Request;
+import org.elasticsearch.xpack.inference.external.response.BaseResponseEntity;
+import org.elasticsearch.xpack.inference.external.response.openai.OpenAiEmbeddingsResponseEntity;
+
+import java.io.IOException;
+
+public class AzureAiStudioEmbeddingsResponseEntity extends BaseResponseEntity {
+ @Override
+ protected InferenceServiceResults fromResponse(Request request, HttpResult response) throws IOException {
+ // expected response type is the same as the Open AI Embeddings
+ return OpenAiEmbeddingsResponseEntity.fromResponse(request, response);
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/cohere/CohereCompletionResponseEntity.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/cohere/CohereCompletionResponseEntity.java
new file mode 100644
index 0000000000000..4740c93ea6c03
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/external/response/cohere/CohereCompletionResponseEntity.java
@@ -0,0 +1,98 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response.cohere;
+
+import org.elasticsearch.common.xcontent.LoggingDeprecationHandler;
+import org.elasticsearch.common.xcontent.XContentParserUtils;
+import org.elasticsearch.xcontent.XContentFactory;
+import org.elasticsearch.xcontent.XContentParser;
+import org.elasticsearch.xcontent.XContentParserConfiguration;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.core.inference.results.ChatCompletionResults;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.request.Request;
+
+import java.io.IOException;
+import java.util.List;
+
+import static org.elasticsearch.common.xcontent.XContentParserUtils.ensureExpectedToken;
+import static org.elasticsearch.xpack.inference.external.response.XContentUtils.moveToFirstToken;
+import static org.elasticsearch.xpack.inference.external.response.XContentUtils.positionParserAtTokenAfterField;
+
+public class CohereCompletionResponseEntity {
+
+ private static final String FAILED_TO_FIND_FIELD_TEMPLATE = "Failed to find required field [%s] in Cohere chat response";
+
+ /**
+ * Parses the Cohere chat json response.
+ * For a request like:
+ *
+ * <pre>
+ * <code>
+ * {
+ * "message": "What is Elastic?"
+ * }
+ * </code>
+ * </pre>
+ *
+ * The response would look like:
+ *
+ * <pre>
+ * <code>
+ * {
+ * "response_id": "some id",
+ * "text": "response",
+ * "generation_id": "some id",
+ * "chat_history": [
+ * {
+ * "role": "USER",
+ * "message": "What is Elastic?"
+ * },
+ * {
+ * "role": "CHATBOT",
+ * "message": "response"
+ * }
+ * ],
+ * "finish_reason": "COMPLETE",
+ * "meta": {
+ * "api_version": {
+ * "version": "1"
+ * },
+ * "billed_units": {
+ * "input_tokens": 4,
+ * "output_tokens": 229
+ * },
+ * "tokens": {
+ * "input_tokens": 70,
+ * "output_tokens": 229
+ * }
+ * }
+ * }
+ * </code>
+ * </pre>
+ */
+
+ public static ChatCompletionResults fromResponse(Request request, HttpResult response) throws IOException {
+ var parserConfig = XContentParserConfiguration.EMPTY.withDeprecationHandler(LoggingDeprecationHandler.INSTANCE);
+
+ try (XContentParser jsonParser = XContentFactory.xContent(XContentType.JSON).createParser(parserConfig, response.body())) {
+ moveToFirstToken(jsonParser);
+
+ XContentParser.Token token = jsonParser.currentToken();
+ XContentParserUtils.ensureExpectedToken(XContentParser.Token.START_OBJECT, token, jsonParser);
+
+ positionParserAtTokenAfterField(jsonParser, "text", FAILED_TO_FIND_FIELD_TEMPLATE);
+
+ XContentParser.Token contentToken = jsonParser.currentToken();
+ ensureExpectedToken(XContentParser.Token.VALUE_STRING, contentToken, jsonParser);
+ String content = jsonParser.text();
+
+ return new ChatCompletionResults(List.of(new ChatCompletionResults.Result(content)));
+ }
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/ServiceUtils.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/ServiceUtils.java
index 47c7cc0fce015..25e8afbe1d16c 100644
--- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/ServiceUtils.java
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/ServiceUtils.java
@@ -34,6 +34,7 @@
import java.util.Locale;
import java.util.Map;
import java.util.Objects;
+import java.util.stream.Collectors;
import static org.elasticsearch.core.Strings.format;
import static org.elasticsearch.xpack.inference.services.ServiceFields.SIMILARITY;
@@ -91,6 +92,40 @@ public static T removeAsType(Map sourceMap, String key, Clas
}
}
+ /**
+ * Remove the object from the map and cast to first assignable type in the expected types list.
+ * If the object cannot be cast to one of the types an error is added to the
+ * {@code validationException} parameter
+ *
+ * @param sourceMap Map containing fields
+ * @param key The key of the object to remove
+ * @param types The expected types of the removed object
+ * @param validationException If the value is not of type {@code type}
+ * @return {@code null} if not present else the object cast to the first assignable type in the types list
+ */
+ public static Object removeAsOneOfTypes(
+ Map<String, Object> sourceMap,
+ String key,
+ List<Class<?>> types,
+ ValidationException validationException
+ ) {
+ Object o = sourceMap.remove(key);
+ if (o == null) {
+ return null;
+ }
+
+ for (Class<?> type : types) {
+ if (type.isAssignableFrom(o.getClass())) {
+ return type.cast(o);
+ }
+ }
+
+ validationException.addValidationError(
+ invalidTypesErrorMsg(key, o, types.stream().map(Class::getSimpleName).collect(Collectors.toList()))
+ );
+ return null;
+ }
+
@SuppressWarnings("unchecked")
+ public static Map<String, Object> removeFromMap(Map<String, Object> sourceMap, String fieldName) {
+ return (Map<String, Object>) sourceMap.remove(fieldName);
@@ -151,6 +186,16 @@ public static String invalidTypeErrorMsg(String settingName, Object foundObject,
);
}
+ public static String invalidTypesErrorMsg(String settingName, Object foundObject, List<String> expectedTypes) {
+ return Strings.format(
+ // omitting [ ] for the last string as this will be added, if you convert the list to a string anyway
+ "field [%s] is not of one of the expected types. The value [%s] cannot be converted to one of %s",
+ settingName,
+ foundObject,
+ expectedTypes
+ );
+ }
+
public static String invalidUrlErrorMsg(String url, String settingName, String settingScope) {
return Strings.format("[%s] Invalid url [%s] received for field [%s]", settingScope, url, settingName);
}
@@ -325,7 +370,7 @@ public static Integer extractOptionalPositiveInteger(
}
if (optionalField != null && optionalField <= 0) {
- validationException.addValidationError(ServiceUtils.mustBeAPositiveNumberErrorMessage(settingName, scope, optionalField));
+ validationException.addValidationError(ServiceUtils.mustBeAPositiveIntegerErrorMessage(settingName, scope, optionalField));
}
if (validationException.validationErrors().size() > initialValidationErrorCount) {
@@ -335,6 +380,99 @@ public static Integer extractOptionalPositiveInteger(
return optionalField;
}
+ public static Float extractOptionalFloat(Map<String, Object> map, String settingName) {
+ return ServiceUtils.removeAsType(map, settingName, Float.class);
+ }
+
+ public static Double extractOptionalDoubleInRange(
+ Map map,
+ String settingName,
+ @Nullable Double minValue,
+ @Nullable Double maxValue,
+ String scope,
+ ValidationException validationException
+ ) {
+ int initialValidationErrorCount = validationException.validationErrors().size();
+ var doubleReturn = ServiceUtils.removeAsType(map, settingName, Double.class, validationException);
+
+ if (validationException.validationErrors().size() > initialValidationErrorCount) {
+ return null;
+ }
+
+ if (doubleReturn != null && minValue != null && doubleReturn < minValue) {
+ validationException.addValidationError(
+ ServiceUtils.mustBeGreaterThanOrEqualNumberErrorMessage(settingName, scope, doubleReturn, minValue)
+ );
+ }
+
+ if (doubleReturn != null && maxValue != null && doubleReturn > maxValue) {
+ validationException.addValidationError(
+ ServiceUtils.mustBeLessThanOrEqualNumberErrorMessage(settingName, scope, doubleReturn, maxValue)
+ );
+ }
+
+ if (validationException.validationErrors().size() > initialValidationErrorCount) {
+ return null;
+ }
+
+ return doubleReturn;
+ }
+
+ public static <E extends Enum<E>> E extractRequiredEnum(
+ Map<String, Object> map,
+ String settingName,
+ String scope,
+ EnumConstructor<E> constructor,
+ EnumSet<E> validValues,
+ ValidationException validationException
+ ) {
+ int initialValidationErrorCount = validationException.validationErrors().size();
+ var enumReturn = extractOptionalEnum(map, settingName, scope, constructor, validValues, validationException);
+
+ if (validationException.validationErrors().size() > initialValidationErrorCount) {
+ return null;
+ }
+
+ if (enumReturn == null) {
+ validationException.addValidationError(ServiceUtils.missingSettingErrorMsg(settingName, scope));
+ }
+
+ return enumReturn;
+ }
+
+ public static Long extractOptionalPositiveLong(
+ Map<String, Object> map,
+ String settingName,
+ String scope,
+ ValidationException validationException
+ ) {
+ // We don't want callers to handle the implementation detail that a long is expected (also treat integers like a long)
+ List<Class<?>> types = List.of(Integer.class, Long.class);
+ int initialValidationErrorCount = validationException.validationErrors().size();
+ var optionalField = ServiceUtils.removeAsOneOfTypes(map, settingName, types, validationException);
+
+ if (optionalField != null) {
+ try {
+ // Use String.valueOf first as there's no Long.valueOf(Object o)
+ Long longValue = Long.valueOf(String.valueOf(optionalField));
+
+ if (longValue <= 0L) {
+ validationException.addValidationError(ServiceUtils.mustBeAPositiveLongErrorMessage(settingName, scope, longValue));
+ }
+
+ if (validationException.validationErrors().size() > initialValidationErrorCount) {
+ return null;
+ }
+
+ return longValue;
+ } catch (NumberFormatException e) {
+ validationException.addValidationError(format("unable to parse long [%s]", e));
+ }
+ }
+
+ return null;
+ }
+
+ public static <E extends Enum<E>> E extractOptionalEnum(
+ Map<String, Object> map,
String settingName,
@@ -391,10 +529,26 @@ private static <E extends Enum<E>> void validateEnumValue(E enumValue, EnumSet
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioConstants.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioConstants.java
new file mode 100644
index 0000000000000..296b8cf09f8c0
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioConstants.java
@@ -0,0 +1,39 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio;
+
+public class AzureAiStudioConstants {
+ public static final String EMBEDDINGS_URI_PATH = "/v1/embeddings";
+ public static final String COMPLETIONS_URI_PATH = "/v1/chat/completions";
+
+ // common service settings fields
+ public static final String TARGET_FIELD = "target";
+ public static final String ENDPOINT_TYPE_FIELD = "endpoint_type";
+ public static final String PROVIDER_FIELD = "provider";
+ public static final String API_KEY_FIELD = "api_key";
+
+ // embeddings service and request settings
+ public static final String INPUT_FIELD = "input";
+ public static final String DIMENSIONS_FIELD = "dimensions";
+ public static final String DIMENSIONS_SET_BY_USER = "dimensions_set_by_user";
+
+ // embeddings task settings fields
+ public static final String USER_FIELD = "user";
+
+ // completion task settings fields
+ public static final String TEMPERATURE_FIELD = "temperature";
+ public static final String TOP_P_FIELD = "top_p";
+ public static final String DO_SAMPLE_FIELD = "do_sample";
+ public static final String MAX_TOKENS_FIELD = "max_tokens";
+ public static final String MAX_NEW_TOKENS_FIELD = "max_new_tokens";
+
+ public static final Double MIN_TEMPERATURE_TOP_P = 0.0;
+ public static final Double MAX_TEMPERATURE_TOP_P = 2.0;
+
+ private AzureAiStudioConstants() {}
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioEndpointType.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioEndpointType.java
new file mode 100644
index 0000000000000..ece63f4bbf0cd
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioEndpointType.java
@@ -0,0 +1,26 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio;
+
+import java.util.Locale;
+
+public enum AzureAiStudioEndpointType {
+ TOKEN,
+ REALTIME;
+
+ public static String NAME = "azure_ai_studio_endpoint_type";
+
+ public static AzureAiStudioEndpointType fromString(String name) {
+ return valueOf(name.trim().toUpperCase(Locale.ROOT));
+ }
+
+ @Override
+ public String toString() {
+ return name().toLowerCase(Locale.ROOT);
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioModel.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioModel.java
new file mode 100644
index 0000000000000..a5dd491d198ae
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioModel.java
@@ -0,0 +1,104 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio;
+
+import org.elasticsearch.inference.Model;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.ModelSecrets;
+import org.elasticsearch.inference.TaskSettings;
+import org.elasticsearch.xpack.inference.external.action.ExecutableAction;
+import org.elasticsearch.xpack.inference.external.action.azureaistudio.AzureAiStudioActionVisitor;
+import org.elasticsearch.xpack.inference.services.settings.DefaultSecretSettings;
+import org.elasticsearch.xpack.inference.services.settings.RateLimitSettings;
+
+import java.net.URI;
+import java.net.URISyntaxException;
+import java.util.Map;
+import java.util.Objects;
+
+/**
+ * Base class for Azure AI Studio models. There are some common properties across the task types
+ * including:
+ * - target:
+ * - uri:
+ * - provider:
+ * - endpointType:
+ */
+public abstract class AzureAiStudioModel extends Model {
+ protected String target;
+ protected URI uri;
+ protected AzureAiStudioProvider provider;
+ protected AzureAiStudioEndpointType endpointType;
+ protected RateLimitSettings rateLimitSettings;
+
+ public AzureAiStudioModel(AzureAiStudioModel model, TaskSettings taskSettings, RateLimitSettings rateLimitSettings) {
+ super(model, taskSettings);
+ this.rateLimitSettings = Objects.requireNonNull(rateLimitSettings);
+ setPropertiesFromServiceSettings((AzureAiStudioServiceSettings) model.getServiceSettings());
+ }
+
+ public AzureAiStudioModel(AzureAiStudioModel model, AzureAiStudioServiceSettings serviceSettings) {
+ super(model, serviceSettings);
+ setPropertiesFromServiceSettings(serviceSettings);
+ }
+
+ protected AzureAiStudioModel(ModelConfigurations modelConfigurations, ModelSecrets modelSecrets) {
+ super(modelConfigurations, modelSecrets);
+ setPropertiesFromServiceSettings((AzureAiStudioServiceSettings) modelConfigurations.getServiceSettings());
+ }
+
+ private void setPropertiesFromServiceSettings(AzureAiStudioServiceSettings serviceSettings) {
+ this.target = serviceSettings.target;
+ this.provider = serviceSettings.provider();
+ this.endpointType = serviceSettings.endpointType();
+ this.rateLimitSettings = serviceSettings.rateLimitSettings();
+ try {
+ this.uri = getEndpointUri();
+ } catch (URISyntaxException e) {
+ throw new RuntimeException(e);
+ }
+ }
+
+ protected abstract URI getEndpointUri() throws URISyntaxException;
+
+ public String target() {
+ return this.target;
+ }
+
+ public RateLimitSettings rateLimitSettings() {
+ return this.rateLimitSettings;
+ }
+
+ public AzureAiStudioProvider provider() {
+ return this.provider;
+ }
+
+ public AzureAiStudioEndpointType endpointType() {
+ return this.endpointType;
+ }
+
+ public URI uri() {
+ return this.uri;
+ }
+
+ // Needed for testing only
+ public void setURI(String newUri) {
+ try {
+ this.uri = new URI(newUri);
+ } catch (URISyntaxException e) {
+ // swallow any error
+ }
+ }
+
+ @Override
+ public DefaultSecretSettings getSecretSettings() {
+ return (DefaultSecretSettings) super.getSecretSettings();
+ }
+
+ public abstract ExecutableAction accept(AzureAiStudioActionVisitor creator, Map<String, Object> taskSettings);
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioProvider.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioProvider.java
new file mode 100644
index 0000000000000..6b3efca0888f3
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioProvider.java
@@ -0,0 +1,31 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio;
+
+import java.util.Locale;
+
+/**
+ * The model providers whose deployments can be hosted on Azure AI Studio.
+ * Serialized in lowercase via {@link #toString()}; parsed case-insensitively via
+ * {@link #fromString(String)}.
+ */
+public enum AzureAiStudioProvider {
+    OPENAI,
+    MISTRAL,
+    META,
+    MICROSOFT_PHI,
+    COHERE,
+    DATABRICKS;
+
+    // final: this is a constant identifier and must not be reassignable
+    public static final String NAME = "azure_ai_studio_provider";
+
+    /** Parses a provider name, ignoring surrounding whitespace and case. */
+    public static AzureAiStudioProvider fromString(String name) {
+        return valueOf(name.trim().toUpperCase(Locale.ROOT));
+    }
+
+    @Override
+    public String toString() {
+        return name().toLowerCase(Locale.ROOT);
+    }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioProviderCapabilities.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioProviderCapabilities.java
new file mode 100644
index 0000000000000..af064707536eb
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioProviderCapabilities.java
@@ -0,0 +1,85 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio;
+
+import org.elasticsearch.inference.TaskType;
+
+import java.util.List;
+
+/**
+ * Static capability tables describing which Azure AI Studio providers support which task
+ * types, and which endpoint types each provider offers per task.
+ */
+public final class AzureAiStudioProviderCapabilities {
+
+    // these providers have embeddings inference
+    public static final List<AzureAiStudioProvider> embeddingProviders = List.of(
+        AzureAiStudioProvider.OPENAI,
+        AzureAiStudioProvider.COHERE
+    );
+
+    // these providers have chat completion inference (all providers at the moment)
+    public static final List<AzureAiStudioProvider> chatCompletionProviders = List.of(AzureAiStudioProvider.values());
+
+    // these providers allow token ("pay as you go") embeddings endpoints
+    public static final List<AzureAiStudioProvider> tokenEmbeddingsProviders = List.of(
+        AzureAiStudioProvider.OPENAI,
+        AzureAiStudioProvider.COHERE
+    );
+
+    // these providers allow realtime embeddings endpoints (none at the moment)
+    public static final List<AzureAiStudioProvider> realtimeEmbeddingsProviders = List.of();
+
+    // these providers allow token ("pay as you go") chat completion endpoints
+    public static final List<AzureAiStudioProvider> tokenChatCompletionProviders = List.of(
+        AzureAiStudioProvider.OPENAI,
+        AzureAiStudioProvider.META,
+        AzureAiStudioProvider.COHERE
+    );
+
+    // these providers allow realtime chat completion endpoints
+    public static final List<AzureAiStudioProvider> realtimeChatCompletionProviders = List.of(
+        AzureAiStudioProvider.MISTRAL,
+        AzureAiStudioProvider.META,
+        AzureAiStudioProvider.MICROSOFT_PHI,
+        AzureAiStudioProvider.DATABRICKS
+    );
+
+    /** Returns whether {@code provider} supports {@code taskType} at all. */
+    public static boolean providerAllowsTaskType(AzureAiStudioProvider provider, TaskType taskType) {
+        switch (taskType) {
+            case COMPLETION -> {
+                return chatCompletionProviders.contains(provider);
+            }
+            case TEXT_EMBEDDING -> {
+                return embeddingProviders.contains(provider);
+            }
+            default -> {
+                return false;
+            }
+        }
+    }
+
+    /** Returns whether {@code provider} offers the given endpoint type for {@code taskType}. */
+    public static boolean providerAllowsEndpointTypeForTask(
+        AzureAiStudioProvider provider,
+        TaskType taskType,
+        AzureAiStudioEndpointType endpointType
+    ) {
+        switch (taskType) {
+            case COMPLETION -> {
+                return (endpointType == AzureAiStudioEndpointType.TOKEN)
+                    ? tokenChatCompletionProviders.contains(provider)
+                    : realtimeChatCompletionProviders.contains(provider);
+            }
+            case TEXT_EMBEDDING -> {
+                return (endpointType == AzureAiStudioEndpointType.TOKEN)
+                    ? tokenEmbeddingsProviders.contains(provider)
+                    : realtimeEmbeddingsProviders.contains(provider);
+            }
+            default -> {
+                return false;
+            }
+        }
+    }
+
+    // utility class — not instantiable
+    private AzureAiStudioProviderCapabilities() {}
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioService.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioService.java
new file mode 100644
index 0000000000000..c488eac422401
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioService.java
@@ -0,0 +1,358 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio;
+
+import org.elasticsearch.ElasticsearchStatusException;
+import org.elasticsearch.TransportVersion;
+import org.elasticsearch.TransportVersions;
+import org.elasticsearch.action.ActionListener;
+import org.elasticsearch.common.Strings;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.core.TimeValue;
+import org.elasticsearch.inference.ChunkedInferenceServiceResults;
+import org.elasticsearch.inference.ChunkingOptions;
+import org.elasticsearch.inference.InferenceServiceResults;
+import org.elasticsearch.inference.InputType;
+import org.elasticsearch.inference.Model;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.ModelSecrets;
+import org.elasticsearch.inference.SimilarityMeasure;
+import org.elasticsearch.inference.TaskType;
+import org.elasticsearch.rest.RestStatus;
+import org.elasticsearch.xpack.core.inference.results.ChunkedTextEmbeddingResults;
+import org.elasticsearch.xpack.core.inference.results.ErrorChunkedInferenceResults;
+import org.elasticsearch.xpack.core.inference.results.TextEmbeddingResults;
+import org.elasticsearch.xpack.core.ml.inference.results.ErrorInferenceResults;
+import org.elasticsearch.xpack.inference.external.action.azureaistudio.AzureAiStudioActionCreator;
+import org.elasticsearch.xpack.inference.external.http.sender.DocumentsOnlyInput;
+import org.elasticsearch.xpack.inference.external.http.sender.HttpRequestSender;
+import org.elasticsearch.xpack.inference.services.ConfigurationParseContext;
+import org.elasticsearch.xpack.inference.services.SenderService;
+import org.elasticsearch.xpack.inference.services.ServiceComponents;
+import org.elasticsearch.xpack.inference.services.ServiceUtils;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionModel;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionTaskSettings;
+import org.elasticsearch.xpack.inference.services.azureaistudio.embeddings.AzureAiStudioEmbeddingsModel;
+import org.elasticsearch.xpack.inference.services.azureaistudio.embeddings.AzureAiStudioEmbeddingsServiceSettings;
+
+import java.util.List;
+import java.util.Map;
+import java.util.Set;
+
+import static org.elasticsearch.xpack.core.inference.results.ResultUtils.createInvalidChunkedResultException;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.createInvalidModelException;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.parsePersistedConfigErrorMsg;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.removeFromMapOrDefaultEmpty;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.removeFromMapOrThrowIfNull;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.throwIfNotEmptyMap;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProviderCapabilities.providerAllowsEndpointTypeForTask;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProviderCapabilities.providerAllowsTaskType;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionTaskSettings.DEFAULT_MAX_NEW_TOKENS;
+
+public class AzureAiStudioService extends SenderService {
+
+ private static final String NAME = "azureaistudio";
+
+ public AzureAiStudioService(HttpRequestSender.Factory factory, ServiceComponents serviceComponents) {
+ super(factory, serviceComponents);
+ }
+
+ @Override
+ protected void doInfer(
+ Model model,
+ List input,
+ Map taskSettings,
+ InputType inputType,
+ TimeValue timeout,
+ ActionListener listener
+ ) {
+ var actionCreator = new AzureAiStudioActionCreator(getSender(), getServiceComponents());
+
+ if (model instanceof AzureAiStudioModel baseAzureAiStudioModel) {
+ var action = baseAzureAiStudioModel.accept(actionCreator, taskSettings);
+ action.execute(new DocumentsOnlyInput(input), timeout, listener);
+ } else {
+ listener.onFailure(createInvalidModelException(model));
+ }
+ }
+
+ @Override
+ protected void doInfer(
+ Model model,
+ String query,
+ List input,
+ Map taskSettings,
+ InputType inputType,
+ TimeValue timeout,
+ ActionListener listener
+ ) {
+ throw new UnsupportedOperationException("Azure AI Studio service does not support inference with query input");
+ }
+
+ @Override
+ protected void doChunkedInfer(
+ Model model,
+ String query,
+ List input,
+ Map taskSettings,
+ InputType inputType,
+ ChunkingOptions chunkingOptions,
+ TimeValue timeout,
+ ActionListener> listener
+ ) {
+ ActionListener inferListener = listener.delegateFailureAndWrap(
+ (delegate, response) -> delegate.onResponse(translateToChunkedResults(input, response))
+ );
+
+ doInfer(model, input, taskSettings, inputType, timeout, inferListener);
+ }
+
+ private static List translateToChunkedResults(
+ List inputs,
+ InferenceServiceResults inferenceResults
+ ) {
+ if (inferenceResults instanceof TextEmbeddingResults textEmbeddingResults) {
+ return ChunkedTextEmbeddingResults.of(inputs, textEmbeddingResults);
+ } else if (inferenceResults instanceof ErrorInferenceResults error) {
+ return List.of(new ErrorChunkedInferenceResults(error.getException()));
+ } else {
+ throw createInvalidChunkedResultException(inferenceResults.getWriteableName());
+ }
+ }
+
+ @Override
+ public void parseRequestConfig(
+ String inferenceEntityId,
+ TaskType taskType,
+ Map config,
+ Set platformArchitectures,
+ ActionListener parsedModelListener
+ ) {
+ try {
+ Map serviceSettingsMap = removeFromMapOrThrowIfNull(config, ModelConfigurations.SERVICE_SETTINGS);
+ Map taskSettingsMap = removeFromMapOrDefaultEmpty(config, ModelConfigurations.TASK_SETTINGS);
+
+ AzureAiStudioModel model = createModel(
+ inferenceEntityId,
+ taskType,
+ serviceSettingsMap,
+ taskSettingsMap,
+ serviceSettingsMap,
+ TaskType.unsupportedTaskTypeErrorMsg(taskType, NAME),
+ ConfigurationParseContext.REQUEST
+ );
+
+ throwIfNotEmptyMap(config, NAME);
+ throwIfNotEmptyMap(serviceSettingsMap, NAME);
+ throwIfNotEmptyMap(taskSettingsMap, NAME);
+
+ parsedModelListener.onResponse(model);
+ } catch (Exception e) {
+ parsedModelListener.onFailure(e);
+ }
+ }
+
+ @Override
+ public AzureAiStudioModel parsePersistedConfigWithSecrets(
+ String inferenceEntityId,
+ TaskType taskType,
+ Map config,
+ Map secrets
+ ) {
+ Map serviceSettingsMap = removeFromMapOrThrowIfNull(config, ModelConfigurations.SERVICE_SETTINGS);
+ Map taskSettingsMap = removeFromMapOrDefaultEmpty(config, ModelConfigurations.TASK_SETTINGS);
+ Map secretSettingsMap = removeFromMapOrDefaultEmpty(secrets, ModelSecrets.SECRET_SETTINGS);
+
+ return createModelFromPersistent(
+ inferenceEntityId,
+ taskType,
+ serviceSettingsMap,
+ taskSettingsMap,
+ secretSettingsMap,
+ parsePersistedConfigErrorMsg(inferenceEntityId, NAME)
+ );
+ }
+
+ @Override
+ public Model parsePersistedConfig(String inferenceEntityId, TaskType taskType, Map config) {
+ Map serviceSettingsMap = removeFromMapOrThrowIfNull(config, ModelConfigurations.SERVICE_SETTINGS);
+ Map taskSettingsMap = removeFromMapOrDefaultEmpty(config, ModelConfigurations.TASK_SETTINGS);
+
+ return createModelFromPersistent(
+ inferenceEntityId,
+ taskType,
+ serviceSettingsMap,
+ taskSettingsMap,
+ null,
+ parsePersistedConfigErrorMsg(inferenceEntityId, NAME)
+ );
+ }
+
+ @Override
+ public String name() {
+ return NAME;
+ }
+
+ @Override
+ public TransportVersion getMinimalSupportedVersion() {
+ return TransportVersions.ML_INFERENCE_AZURE_AI_STUDIO;
+ }
+
+ private static AzureAiStudioModel createModel(
+ String inferenceEntityId,
+ TaskType taskType,
+ Map serviceSettings,
+ Map taskSettings,
+ @Nullable Map secretSettings,
+ String failureMessage,
+ ConfigurationParseContext context
+ ) {
+
+ if (taskType == TaskType.TEXT_EMBEDDING) {
+ var embeddingsModel = new AzureAiStudioEmbeddingsModel(
+ inferenceEntityId,
+ taskType,
+ NAME,
+ serviceSettings,
+ taskSettings,
+ secretSettings,
+ context
+ );
+ checkProviderAndEndpointTypeForTask(
+ TaskType.TEXT_EMBEDDING,
+ embeddingsModel.getServiceSettings().provider(),
+ embeddingsModel.getServiceSettings().endpointType()
+ );
+ return embeddingsModel;
+ }
+
+ if (taskType == TaskType.COMPLETION) {
+ var completionModel = new AzureAiStudioChatCompletionModel(
+ inferenceEntityId,
+ taskType,
+ NAME,
+ serviceSettings,
+ taskSettings,
+ secretSettings,
+ context
+ );
+ checkProviderAndEndpointTypeForTask(
+ TaskType.COMPLETION,
+ completionModel.getServiceSettings().provider(),
+ completionModel.getServiceSettings().endpointType()
+ );
+ return completionModel;
+ }
+
+ throw new ElasticsearchStatusException(failureMessage, RestStatus.BAD_REQUEST);
+ }
+
+ private AzureAiStudioModel createModelFromPersistent(
+ String inferenceEntityId,
+ TaskType taskType,
+ Map serviceSettings,
+ Map taskSettings,
+ Map secretSettings,
+ String failureMessage
+ ) {
+ return createModel(
+ inferenceEntityId,
+ taskType,
+ serviceSettings,
+ taskSettings,
+ secretSettings,
+ failureMessage,
+ ConfigurationParseContext.PERSISTENT
+ );
+ }
+
+ @Override
+ public void checkModelConfig(Model model, ActionListener listener) {
+ if (model instanceof AzureAiStudioEmbeddingsModel embeddingsModel) {
+ ServiceUtils.getEmbeddingSize(
+ model,
+ this,
+ listener.delegateFailureAndWrap((l, size) -> l.onResponse(updateEmbeddingModelConfig(embeddingsModel, size)))
+ );
+ } else if (model instanceof AzureAiStudioChatCompletionModel chatCompletionModel) {
+ listener.onResponse(updateChatCompletionModelConfig(chatCompletionModel));
+ } else {
+ listener.onResponse(model);
+ }
+ }
+
+ private AzureAiStudioEmbeddingsModel updateEmbeddingModelConfig(AzureAiStudioEmbeddingsModel embeddingsModel, int embeddingsSize) {
+ if (embeddingsModel.getServiceSettings().dimensionsSetByUser()
+ && embeddingsModel.getServiceSettings().dimensions() != null
+ && embeddingsModel.getServiceSettings().dimensions() != embeddingsSize) {
+ throw new ElasticsearchStatusException(
+ Strings.format(
+ "The retrieved embeddings size [%s] does not match the size specified in the settings [%s]. "
+ + "Please recreate the [%s] configuration with the correct dimensions",
+ embeddingsSize,
+ embeddingsModel.getServiceSettings().dimensions(),
+ embeddingsModel.getConfigurations().getInferenceEntityId()
+ ),
+ RestStatus.BAD_REQUEST
+ );
+ }
+
+ var similarityFromModel = embeddingsModel.getServiceSettings().similarity();
+ var similarityToUse = similarityFromModel == null ? SimilarityMeasure.DOT_PRODUCT : similarityFromModel;
+
+ AzureAiStudioEmbeddingsServiceSettings serviceSettings = new AzureAiStudioEmbeddingsServiceSettings(
+ embeddingsModel.getServiceSettings().target(),
+ embeddingsModel.getServiceSettings().provider(),
+ embeddingsModel.getServiceSettings().endpointType(),
+ embeddingsSize,
+ embeddingsModel.getServiceSettings().dimensionsSetByUser(),
+ embeddingsModel.getServiceSettings().maxInputTokens(),
+ similarityToUse,
+ embeddingsModel.getServiceSettings().rateLimitSettings()
+ );
+
+ return new AzureAiStudioEmbeddingsModel(embeddingsModel, serviceSettings);
+ }
+
+ private AzureAiStudioChatCompletionModel updateChatCompletionModelConfig(AzureAiStudioChatCompletionModel chatCompletionModel) {
+ var modelMaxNewTokens = chatCompletionModel.getTaskSettings().maxNewTokens();
+ var maxNewTokensToUse = modelMaxNewTokens == null ? DEFAULT_MAX_NEW_TOKENS : modelMaxNewTokens;
+ var updatedTaskSettings = new AzureAiStudioChatCompletionTaskSettings(
+ chatCompletionModel.getTaskSettings().temperature(),
+ chatCompletionModel.getTaskSettings().topP(),
+ chatCompletionModel.getTaskSettings().doSample(),
+ maxNewTokensToUse
+ );
+ return new AzureAiStudioChatCompletionModel(chatCompletionModel, updatedTaskSettings);
+ }
+
+ private static void checkProviderAndEndpointTypeForTask(
+ TaskType taskType,
+ AzureAiStudioProvider provider,
+ AzureAiStudioEndpointType endpointType
+ ) {
+ if (providerAllowsTaskType(provider, taskType) == false) {
+ throw new ElasticsearchStatusException(
+ Strings.format("The [%s] task type for provider [%s] is not available", taskType, provider),
+ RestStatus.BAD_REQUEST
+ );
+ }
+
+ if (providerAllowsEndpointTypeForTask(provider, taskType, endpointType) == false) {
+ throw new ElasticsearchStatusException(
+ Strings.format(
+ "The [%s] endpoint type with [%s] task type for provider [%s] is not available",
+ endpointType,
+ taskType,
+ provider
+ ),
+ RestStatus.BAD_REQUEST
+ );
+ }
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioServiceSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioServiceSettings.java
new file mode 100644
index 0000000000000..10c57e19b6403
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioServiceSettings.java
@@ -0,0 +1,130 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio;
+
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.ServiceSettings;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xpack.inference.services.ConfigurationParseContext;
+import org.elasticsearch.xpack.inference.services.settings.FilteredXContentObject;
+import org.elasticsearch.xpack.inference.services.settings.RateLimitSettings;
+
+import java.io.IOException;
+import java.util.EnumSet;
+import java.util.Map;
+import java.util.Objects;
+
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractRequiredEnum;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractRequiredString;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.ENDPOINT_TYPE_FIELD;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.PROVIDER_FIELD;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.TARGET_FIELD;
+
+public abstract class AzureAiStudioServiceSettings extends FilteredXContentObject implements ServiceSettings {
+
+ protected final String target;
+ protected final AzureAiStudioProvider provider;
+ protected final AzureAiStudioEndpointType endpointType;
+ protected final RateLimitSettings rateLimitSettings;
+
+ protected static final RateLimitSettings DEFAULT_RATE_LIMIT_SETTINGS = new RateLimitSettings(240);
+
+ protected static BaseAzureAiStudioCommonFields fromMap(
+ Map map,
+ ValidationException validationException,
+ ConfigurationParseContext context
+ ) {
+ String target = extractRequiredString(map, TARGET_FIELD, ModelConfigurations.SERVICE_SETTINGS, validationException);
+ RateLimitSettings rateLimitSettings = RateLimitSettings.of(map, DEFAULT_RATE_LIMIT_SETTINGS, validationException);
+ AzureAiStudioEndpointType endpointType = extractRequiredEnum(
+ map,
+ ENDPOINT_TYPE_FIELD,
+ ModelConfigurations.SERVICE_SETTINGS,
+ AzureAiStudioEndpointType::fromString,
+ EnumSet.allOf(AzureAiStudioEndpointType.class),
+ validationException
+ );
+
+ AzureAiStudioProvider provider = extractRequiredEnum(
+ map,
+ PROVIDER_FIELD,
+ ModelConfigurations.SERVICE_SETTINGS,
+ AzureAiStudioProvider::fromString,
+ EnumSet.allOf(AzureAiStudioProvider.class),
+ validationException
+ );
+
+ return new BaseAzureAiStudioCommonFields(target, provider, endpointType, rateLimitSettings);
+ }
+
+ protected AzureAiStudioServiceSettings(StreamInput in) throws IOException {
+ this.target = in.readString();
+ this.provider = in.readEnum(AzureAiStudioProvider.class);
+ this.endpointType = in.readEnum(AzureAiStudioEndpointType.class);
+ this.rateLimitSettings = new RateLimitSettings(in);
+ }
+
+ protected AzureAiStudioServiceSettings(
+ String target,
+ AzureAiStudioProvider provider,
+ AzureAiStudioEndpointType endpointType,
+ @Nullable RateLimitSettings rateLimitSettings
+ ) {
+ this.target = target;
+ this.provider = provider;
+ this.endpointType = endpointType;
+ this.rateLimitSettings = Objects.requireNonNullElse(rateLimitSettings, DEFAULT_RATE_LIMIT_SETTINGS);
+ }
+
+ protected record BaseAzureAiStudioCommonFields(
+ String target,
+ AzureAiStudioProvider provider,
+ AzureAiStudioEndpointType endpointType,
+ RateLimitSettings rateLimitSettings
+ ) {}
+
+ public String target() {
+ return this.target;
+ }
+
+ public AzureAiStudioProvider provider() {
+ return this.provider;
+ }
+
+ public AzureAiStudioEndpointType endpointType() {
+ return this.endpointType;
+ }
+
+ public RateLimitSettings rateLimitSettings() {
+ return this.rateLimitSettings;
+ }
+
+ @Override
+ public void writeTo(StreamOutput out) throws IOException {
+ out.writeString(target);
+ out.writeEnum(provider);
+ out.writeEnum(endpointType);
+ rateLimitSettings.writeTo(out);
+ }
+
+ protected void addXContentFields(XContentBuilder builder, Params params) throws IOException {
+ this.addExposedXContentFields(builder, params);
+ rateLimitSettings.toXContent(builder, params);
+ }
+
+ protected void addExposedXContentFields(XContentBuilder builder, Params params) throws IOException {
+ builder.field(TARGET_FIELD, this.target);
+ builder.field(PROVIDER_FIELD, this.provider);
+ builder.field(ENDPOINT_TYPE_FIELD, this.endpointType);
+ }
+
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionModel.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionModel.java
new file mode 100644
index 0000000000000..5afb3aaed61ff
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionModel.java
@@ -0,0 +1,105 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio.completion;
+
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.ModelSecrets;
+import org.elasticsearch.inference.TaskType;
+import org.elasticsearch.xpack.inference.external.action.ExecutableAction;
+import org.elasticsearch.xpack.inference.external.action.azureaistudio.AzureAiStudioActionVisitor;
+import org.elasticsearch.xpack.inference.services.ConfigurationParseContext;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioModel;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProvider;
+import org.elasticsearch.xpack.inference.services.settings.DefaultSecretSettings;
+
+import java.net.URI;
+import java.net.URISyntaxException;
+import java.util.Map;
+
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.COMPLETIONS_URI_PATH;
+
+/**
+ * An Azure AI Studio model configured for the chat completion task type.
+ */
+public class AzureAiStudioChatCompletionModel extends AzureAiStudioModel {
+
+    /**
+     * Returns {@code model} with any request-time task settings overrides applied; returns
+     * the model unchanged when no overrides were supplied.
+     */
+    public static AzureAiStudioChatCompletionModel of(AzureAiStudioModel model, Map<String, Object> taskSettings) {
+        var modelAsCompletionModel = (AzureAiStudioChatCompletionModel) model;
+
+        if (taskSettings == null || taskSettings.isEmpty()) {
+            return modelAsCompletionModel;
+        }
+
+        var requestTaskSettings = AzureAiStudioChatCompletionRequestTaskSettings.fromMap(taskSettings);
+        var taskSettingToUse = AzureAiStudioChatCompletionTaskSettings.of(modelAsCompletionModel.getTaskSettings(), requestTaskSettings);
+
+        return new AzureAiStudioChatCompletionModel(modelAsCompletionModel, taskSettingToUse);
+    }
+
+    public AzureAiStudioChatCompletionModel(
+        String inferenceEntityId,
+        TaskType taskType,
+        String service,
+        AzureAiStudioChatCompletionServiceSettings serviceSettings,
+        AzureAiStudioChatCompletionTaskSettings taskSettings,
+        DefaultSecretSettings secrets
+    ) {
+        super(new ModelConfigurations(inferenceEntityId, taskType, service, serviceSettings, taskSettings), new ModelSecrets(secrets));
+    }
+
+    public AzureAiStudioChatCompletionModel(
+        String inferenceEntityId,
+        TaskType taskType,
+        String service,
+        Map<String, Object> serviceSettings,
+        Map<String, Object> taskSettings,
+        @Nullable Map<String, Object> secrets,
+        ConfigurationParseContext context
+    ) {
+        this(
+            inferenceEntityId,
+            taskType,
+            service,
+            AzureAiStudioChatCompletionServiceSettings.fromMap(serviceSettings, context),
+            AzureAiStudioChatCompletionTaskSettings.fromMap(taskSettings),
+            DefaultSecretSettings.fromMap(secrets)
+        );
+    }
+
+    public AzureAiStudioChatCompletionModel(AzureAiStudioChatCompletionModel model, AzureAiStudioChatCompletionTaskSettings taskSettings) {
+        super(model, taskSettings, model.getServiceSettings().rateLimitSettings());
+    }
+
+    @Override
+    public AzureAiStudioChatCompletionServiceSettings getServiceSettings() {
+        return (AzureAiStudioChatCompletionServiceSettings) super.getServiceSettings();
+    }
+
+    @Override
+    public AzureAiStudioChatCompletionTaskSettings getTaskSettings() {
+        return (AzureAiStudioChatCompletionTaskSettings) super.getTaskSettings();
+    }
+
+    // note: getSecretSettings() is inherited from AzureAiStudioModel unchanged; a
+    // pass-through override here would be redundant
+
+    @Override
+    protected URI getEndpointUri() throws URISyntaxException {
+        // OpenAI and realtime endpoints are called at the raw target URL; every other
+        // token endpoint appends the chat completions path
+        if (this.provider == AzureAiStudioProvider.OPENAI || this.endpointType == AzureAiStudioEndpointType.REALTIME) {
+            return new URI(this.target);
+        }
+
+        return new URI(this.target + COMPLETIONS_URI_PATH);
+    }
+
+    @Override
+    public ExecutableAction accept(AzureAiStudioActionVisitor creator, Map<String, Object> taskSettings) {
+        return creator.create(this, taskSettings);
+    }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionRequestTaskSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionRequestTaskSettings.java
new file mode 100644
index 0000000000000..2eef059e3fae1
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionRequestTaskSettings.java
@@ -0,0 +1,83 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio.completion;
+
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants;
+
+import java.util.Map;
+
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalBoolean;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalDoubleInRange;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalPositiveInteger;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.DO_SAMPLE_FIELD;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.MAX_NEW_TOKENS_FIELD;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.TEMPERATURE_FIELD;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.TOP_P_FIELD;
+
+/**
+ * Task settings overrides supplied on an individual chat completion request. All fields are
+ * optional; {@code null} means "use the value from the persisted task settings".
+ */
+public record AzureAiStudioChatCompletionRequestTaskSettings(
+    @Nullable Double temperature,
+    @Nullable Double topP,
+    @Nullable Boolean doSample,
+    @Nullable Integer maxNewTokens
+) {
+
+    public static final AzureAiStudioChatCompletionRequestTaskSettings EMPTY_SETTINGS = new AzureAiStudioChatCompletionRequestTaskSettings(
+        null,
+        null,
+        null,
+        null
+    );
+
+    /**
+     * Extracts the task settings from a map. All settings are considered optional and the absence of a setting
+     * does not throw an error.
+     *
+     * @param map the settings received from a request
+     * @return a {@link AzureAiStudioChatCompletionRequestTaskSettings}
+     * @throws ValidationException if any supplied value is out of range or of the wrong type
+     */
+    public static AzureAiStudioChatCompletionRequestTaskSettings fromMap(Map<String, Object> map) {
+        if (map.isEmpty()) {
+            return AzureAiStudioChatCompletionRequestTaskSettings.EMPTY_SETTINGS;
+        }
+
+        ValidationException validationException = new ValidationException();
+
+        var temperature = extractOptionalDoubleInRange(
+            map,
+            TEMPERATURE_FIELD,
+            AzureAiStudioConstants.MIN_TEMPERATURE_TOP_P,
+            AzureAiStudioConstants.MAX_TEMPERATURE_TOP_P,
+            ModelConfigurations.TASK_SETTINGS,
+            validationException
+        );
+        var topP = extractOptionalDoubleInRange(
+            map,
+            TOP_P_FIELD,
+            AzureAiStudioConstants.MIN_TEMPERATURE_TOP_P,
+            AzureAiStudioConstants.MAX_TEMPERATURE_TOP_P,
+            ModelConfigurations.TASK_SETTINGS,
+            validationException
+        );
+        Boolean doSample = extractOptionalBoolean(map, DO_SAMPLE_FIELD, validationException);
+        Integer maxNewTokens = extractOptionalPositiveInteger(
+            map,
+            MAX_NEW_TOKENS_FIELD,
+            ModelConfigurations.TASK_SETTINGS,
+            validationException
+        );
+
+        // Report all problems at once rather than failing on the first
+        if (validationException.validationErrors().isEmpty() == false) {
+            throw validationException;
+        }
+
+        return new AzureAiStudioChatCompletionRequestTaskSettings(temperature, topP, doSample, maxNewTokens);
+    }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionServiceSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionServiceSettings.java
new file mode 100644
index 0000000000000..2f8422be5ed90
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionServiceSettings.java
@@ -0,0 +1,123 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio.completion;
+
+import org.elasticsearch.TransportVersion;
+import org.elasticsearch.TransportVersions;
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.xcontent.ToXContent;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xpack.inference.services.ConfigurationParseContext;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProvider;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioServiceSettings;
+import org.elasticsearch.xpack.inference.services.settings.RateLimitSettings;
+
+import java.io.IOException;
+import java.util.Map;
+import java.util.Objects;
+
+public class AzureAiStudioChatCompletionServiceSettings extends AzureAiStudioServiceSettings {
+ public static final String NAME = "azure_ai_studio_chat_completion_service_settings";
+
+ public static AzureAiStudioChatCompletionServiceSettings fromMap(Map map, ConfigurationParseContext context) {
+ ValidationException validationException = new ValidationException();
+
+ var settings = completionSettingsFromMap(map, validationException, context);
+
+ if (validationException.validationErrors().isEmpty() == false) {
+ throw validationException;
+ }
+
+ return new AzureAiStudioChatCompletionServiceSettings(settings);
+ }
+
+ private static AzureAiStudioCompletionCommonFields completionSettingsFromMap(
+ Map map,
+ ValidationException validationException,
+ ConfigurationParseContext context
+ ) {
+ var baseSettings = AzureAiStudioServiceSettings.fromMap(map, validationException, context);
+ return new AzureAiStudioCompletionCommonFields(baseSettings);
+ }
+
+ private record AzureAiStudioCompletionCommonFields(BaseAzureAiStudioCommonFields baseCommonFields) {}
+
+ public AzureAiStudioChatCompletionServiceSettings(
+ String target,
+ AzureAiStudioProvider provider,
+ AzureAiStudioEndpointType endpointType,
+ @Nullable RateLimitSettings rateLimitSettings
+ ) {
+ super(target, provider, endpointType, rateLimitSettings);
+ }
+
+ public AzureAiStudioChatCompletionServiceSettings(StreamInput in) throws IOException {
+ super(in);
+ }
+
+ private AzureAiStudioChatCompletionServiceSettings(AzureAiStudioCompletionCommonFields fields) {
+ this(
+ fields.baseCommonFields.target(),
+ fields.baseCommonFields.provider(),
+ fields.baseCommonFields.endpointType(),
+ fields.baseCommonFields.rateLimitSettings()
+ );
+ }
+
+ @Override
+ public String getWriteableName() {
+ return NAME;
+ }
+
+ @Override
+ public TransportVersion getMinimalSupportedVersion() {
+ return TransportVersions.ML_INFERENCE_AZURE_AI_STUDIO;
+ }
+
+ @Override
+ public void writeTo(StreamOutput out) throws IOException {
+ super.writeTo(out);
+ }
+
+ @Override
+ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+ builder.startObject();
+
+ super.addXContentFields(builder, params);
+
+ builder.endObject();
+ return builder;
+ }
+
+ @Override
+ protected XContentBuilder toXContentFragmentOfExposedFields(XContentBuilder builder, ToXContent.Params params) throws IOException {
+ super.addExposedXContentFields(builder, params);
+ return builder;
+ }
+
+ @Override
+ public boolean equals(Object o) {
+ if (this == o) return true;
+ if (o == null || getClass() != o.getClass()) return false;
+ AzureAiStudioChatCompletionServiceSettings that = (AzureAiStudioChatCompletionServiceSettings) o;
+
+ return Objects.equals(target, that.target)
+ && Objects.equals(provider, that.provider)
+ && Objects.equals(endpointType, that.endpointType)
+ && Objects.equals(rateLimitSettings, that.rateLimitSettings);
+ }
+
+ @Override
+ public int hashCode() {
+ return Objects.hash(target, provider, endpointType, rateLimitSettings);
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionTaskSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionTaskSettings.java
new file mode 100644
index 0000000000000..fc11d96269b68
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/completion/AzureAiStudioChatCompletionTaskSettings.java
@@ -0,0 +1,192 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio.completion;
+
+import org.elasticsearch.TransportVersion;
+import org.elasticsearch.TransportVersions;
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.TaskSettings;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants;
+import org.elasticsearch.xpack.inference.services.azureopenai.embeddings.AzureOpenAiEmbeddingsTaskSettings;
+
+import java.io.IOException;
+import java.util.Map;
+import java.util.Objects;
+
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalBoolean;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalDoubleInRange;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalPositiveInteger;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.DO_SAMPLE_FIELD;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.MAX_NEW_TOKENS_FIELD;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.TEMPERATURE_FIELD;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.TOP_P_FIELD;
+
+public class AzureAiStudioChatCompletionTaskSettings implements TaskSettings {
+ public static final String NAME = "azure_ai_studio_chat_completion_task_settings";
+ public static final Integer DEFAULT_MAX_NEW_TOKENS = 64;
+
+ public static AzureAiStudioChatCompletionTaskSettings fromMap(Map map) {
+ ValidationException validationException = new ValidationException();
+
+ var temperature = extractOptionalDoubleInRange(
+ map,
+ TEMPERATURE_FIELD,
+ AzureAiStudioConstants.MIN_TEMPERATURE_TOP_P,
+ AzureAiStudioConstants.MAX_TEMPERATURE_TOP_P,
+ ModelConfigurations.TASK_SETTINGS,
+ validationException
+ );
+ var topP = extractOptionalDoubleInRange(
+ map,
+ TOP_P_FIELD,
+ AzureAiStudioConstants.MIN_TEMPERATURE_TOP_P,
+ AzureAiStudioConstants.MAX_TEMPERATURE_TOP_P,
+ ModelConfigurations.TASK_SETTINGS,
+ validationException
+ );
+ var doSample = extractOptionalBoolean(map, DO_SAMPLE_FIELD, validationException);
+ var maxNewTokens = extractOptionalPositiveInteger(
+ map,
+ MAX_NEW_TOKENS_FIELD,
+ ModelConfigurations.TASK_SETTINGS,
+ validationException
+ );
+
+ if (validationException.validationErrors().isEmpty() == false) {
+ throw validationException;
+ }
+
+ return new AzureAiStudioChatCompletionTaskSettings(temperature, topP, doSample, maxNewTokens);
+ }
+
+ /**
+ * Creates a new {@link AzureAiStudioChatCompletionTaskSettings} object by overriding the values in originalSettings with the ones
+ * passed in via requestSettings if the fields are not null.
+ * @param originalSettings the original {@link AzureAiStudioChatCompletionTaskSettings} from the inference entity configuration from storage
+ * @param requestSettings the {@link AzureAiStudioChatCompletionRequestTaskSettings} from the request
+ * @return a new {@link AzureAiStudioChatCompletionTaskSettings}
+ */
+ public static AzureAiStudioChatCompletionTaskSettings of(
+ AzureAiStudioChatCompletionTaskSettings originalSettings,
+ AzureAiStudioChatCompletionRequestTaskSettings requestSettings
+ ) {
+
+ var temperature = requestSettings.temperature() == null ? originalSettings.temperature() : requestSettings.temperature();
+ var topP = requestSettings.topP() == null ? originalSettings.topP() : requestSettings.topP();
+ var doSample = requestSettings.doSample() == null ? originalSettings.doSample() : requestSettings.doSample();
+ var maxNewTokens = requestSettings.maxNewTokens() == null ? originalSettings.maxNewTokens() : requestSettings.maxNewTokens();
+
+ return new AzureAiStudioChatCompletionTaskSettings(temperature, topP, doSample, maxNewTokens);
+ }
+
+ public AzureAiStudioChatCompletionTaskSettings(
+ @Nullable Double temperature,
+ @Nullable Double topP,
+ @Nullable Boolean doSample,
+ @Nullable Integer maxNewTokens
+ ) {
+
+ this.temperature = temperature;
+ this.topP = topP;
+ this.doSample = doSample;
+ this.maxNewTokens = maxNewTokens;
+ }
+
+ public AzureAiStudioChatCompletionTaskSettings(StreamInput in) throws IOException {
+ this.temperature = in.readOptionalDouble();
+ this.topP = in.readOptionalDouble();
+ this.doSample = in.readOptionalBoolean();
+ this.maxNewTokens = in.readOptionalInt();
+ }
+
+ private final Double temperature;
+ private final Double topP;
+ private final Boolean doSample;
+ private final Integer maxNewTokens;
+
+ public Double temperature() {
+ return temperature;
+ }
+
+ public Double topP() {
+ return topP;
+ }
+
+ public Boolean doSample() {
+ return doSample;
+ }
+
+ public Integer maxNewTokens() {
+ return maxNewTokens;
+ }
+
+ public boolean areAnyParametersAvailable() {
+ return temperature != null || topP != null || doSample != null || maxNewTokens != null; // "any": true when at least one optional setting is present
+ }
+
+ @Override
+ public String getWriteableName() {
+ return NAME;
+ }
+
+ @Override
+ public TransportVersion getMinimalSupportedVersion() {
+ return TransportVersions.ML_INFERENCE_AZURE_AI_STUDIO; // introduced with Azure AI Studio support; matches the service settings' version
+ }
+
+ @Override
+ public void writeTo(StreamOutput out) throws IOException {
+ out.writeOptionalDouble(temperature);
+ out.writeOptionalDouble(topP);
+ out.writeOptionalBoolean(doSample);
+ out.writeOptionalInt(maxNewTokens);
+ }
+
+ @Override
+ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+ builder.startObject();
+
+ if (temperature != null) {
+ builder.field(TEMPERATURE_FIELD, temperature);
+ }
+ if (topP != null) {
+ builder.field(TOP_P_FIELD, topP);
+ }
+ if (doSample != null) {
+ builder.field(DO_SAMPLE_FIELD, doSample);
+ }
+ if (maxNewTokens != null) {
+ builder.field(MAX_NEW_TOKENS_FIELD, maxNewTokens);
+ }
+
+ builder.endObject();
+ return builder;
+ }
+
+ @Override
+ public boolean equals(Object o) {
+ if (this == o) return true;
+ if (o == null || getClass() != o.getClass()) return false;
+ AzureAiStudioChatCompletionTaskSettings that = (AzureAiStudioChatCompletionTaskSettings) o;
+ return Objects.equals(temperature, that.temperature)
+ && Objects.equals(topP, that.topP)
+ && Objects.equals(doSample, that.doSample)
+ && Objects.equals(maxNewTokens, that.maxNewTokens);
+ }
+
+ @Override
+ public int hashCode() {
+ return Objects.hash(temperature, topP, doSample, maxNewTokens);
+ }
+
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsModel.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsModel.java
new file mode 100644
index 0000000000000..a999b9f0312e6
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsModel.java
@@ -0,0 +1,102 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio.embeddings;
+
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.ModelSecrets;
+import org.elasticsearch.inference.TaskType;
+import org.elasticsearch.xpack.inference.external.action.ExecutableAction;
+import org.elasticsearch.xpack.inference.external.action.azureaistudio.AzureAiStudioActionVisitor;
+import org.elasticsearch.xpack.inference.services.ConfigurationParseContext;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioModel;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProvider;
+import org.elasticsearch.xpack.inference.services.settings.DefaultSecretSettings;
+
+import java.net.URI;
+import java.net.URISyntaxException;
+import java.util.Map;
+
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.EMBEDDINGS_URI_PATH;
+
+public class AzureAiStudioEmbeddingsModel extends AzureAiStudioModel {
+
+ public static AzureAiStudioEmbeddingsModel of(AzureAiStudioEmbeddingsModel model, Map taskSettings) {
+ if (taskSettings == null || taskSettings.isEmpty()) {
+ return model;
+ }
+
+ var requestTaskSettings = AzureAiStudioEmbeddingsRequestTaskSettings.fromMap(taskSettings);
+ var taskSettingToUse = AzureAiStudioEmbeddingsTaskSettings.of(model.getTaskSettings(), requestTaskSettings);
+
+ return new AzureAiStudioEmbeddingsModel(model, taskSettingToUse);
+ }
+
+ public AzureAiStudioEmbeddingsModel(
+ String inferenceEntityId,
+ TaskType taskType,
+ String service,
+ AzureAiStudioEmbeddingsServiceSettings serviceSettings,
+ AzureAiStudioEmbeddingsTaskSettings taskSettings,
+ DefaultSecretSettings secrets
+ ) {
+ super(new ModelConfigurations(inferenceEntityId, taskType, service, serviceSettings, taskSettings), new ModelSecrets(secrets));
+ }
+
+ public AzureAiStudioEmbeddingsModel(
+ String inferenceEntityId,
+ TaskType taskType,
+ String service,
+ Map serviceSettings,
+ Map taskSettings,
+ @Nullable Map secrets,
+ ConfigurationParseContext context
+ ) {
+ this(
+ inferenceEntityId,
+ taskType,
+ service,
+ AzureAiStudioEmbeddingsServiceSettings.fromMap(serviceSettings, context),
+ AzureAiStudioEmbeddingsTaskSettings.fromMap(taskSettings),
+ DefaultSecretSettings.fromMap(secrets)
+ );
+ }
+
+ private AzureAiStudioEmbeddingsModel(AzureAiStudioEmbeddingsModel model, AzureAiStudioEmbeddingsTaskSettings taskSettings) {
+ super(model, taskSettings, model.getServiceSettings().rateLimitSettings());
+ }
+
+ public AzureAiStudioEmbeddingsModel(AzureAiStudioEmbeddingsModel model, AzureAiStudioEmbeddingsServiceSettings serviceSettings) {
+ super(model, serviceSettings);
+ }
+
+ @Override
+ public AzureAiStudioEmbeddingsServiceSettings getServiceSettings() {
+ return (AzureAiStudioEmbeddingsServiceSettings) super.getServiceSettings();
+ }
+
+ @Override
+ public AzureAiStudioEmbeddingsTaskSettings getTaskSettings() {
+ return (AzureAiStudioEmbeddingsTaskSettings) super.getTaskSettings();
+ }
+
+ @Override
+ protected URI getEndpointUri() throws URISyntaxException {
+ if (this.provider == AzureAiStudioProvider.OPENAI || this.endpointType == AzureAiStudioEndpointType.REALTIME) {
+ return new URI(this.target);
+ }
+
+ return new URI(this.target + EMBEDDINGS_URI_PATH);
+ }
+
+ @Override
+ public ExecutableAction accept(AzureAiStudioActionVisitor creator, Map taskSettings) {
+ return creator.create(this, taskSettings);
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsRequestTaskSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsRequestTaskSettings.java
new file mode 100644
index 0000000000000..8c9fd22a7cdf7
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsRequestTaskSettings.java
@@ -0,0 +1,52 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio.embeddings;
+
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.xpack.inference.services.azureopenai.embeddings.AzureOpenAiEmbeddingsRequestTaskSettings;
+
+import java.util.Map;
+
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalString;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.USER_FIELD;
+
+/**
+ * This class handles extracting Azure OpenAI task settings from a request. The difference between this class and
+ * {@link AzureAiStudioEmbeddingsTaskSettings} is that this class considers all fields as optional. It will not throw an error if a field
+ * is missing. This allows overriding persistent task settings.
+ * @param user a unique identifier representing your end-user, which can help OpenAI to monitor and detect abuse, if using an OpenAI model
+ */
+public record AzureAiStudioEmbeddingsRequestTaskSettings(@Nullable String user) {
+ public static final AzureAiStudioEmbeddingsRequestTaskSettings EMPTY_SETTINGS = new AzureAiStudioEmbeddingsRequestTaskSettings(null);
+
+ /**
+ * Extracts the task settings from a map. All settings are considered optional and the absence of a setting
+ * does not throw an error.
+ *
+ * @param map the settings received from a request
+ * @return a {@link AzureAiStudioEmbeddingsRequestTaskSettings}
+ */
+ public static AzureAiStudioEmbeddingsRequestTaskSettings fromMap(Map map) {
+ if (map.isEmpty()) {
+ return AzureAiStudioEmbeddingsRequestTaskSettings.EMPTY_SETTINGS;
+ }
+
+ ValidationException validationException = new ValidationException();
+
+ String user = extractOptionalString(map, USER_FIELD, ModelConfigurations.TASK_SETTINGS, validationException);
+
+ if (validationException.validationErrors().isEmpty() == false) {
+ throw validationException;
+ }
+
+ return new AzureAiStudioEmbeddingsRequestTaskSettings(user);
+ }
+
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsServiceSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsServiceSettings.java
new file mode 100644
index 0000000000000..1a39cd67a70f3
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsServiceSettings.java
@@ -0,0 +1,231 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio.embeddings;
+
+import org.elasticsearch.TransportVersion;
+import org.elasticsearch.TransportVersions;
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.index.mapper.vectors.DenseVectorFieldMapper;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.SimilarityMeasure;
+import org.elasticsearch.xcontent.ToXContent;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xpack.inference.services.ConfigurationParseContext;
+import org.elasticsearch.xpack.inference.services.ServiceUtils;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProvider;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioServiceSettings;
+import org.elasticsearch.xpack.inference.services.settings.RateLimitSettings;
+
+import java.io.IOException;
+import java.util.Map;
+import java.util.Objects;
+
+import static org.elasticsearch.xpack.inference.services.ServiceFields.DIMENSIONS;
+import static org.elasticsearch.xpack.inference.services.ServiceFields.MAX_INPUT_TOKENS;
+import static org.elasticsearch.xpack.inference.services.ServiceFields.SIMILARITY;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalBoolean;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractSimilarity;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.removeAsType;
+
+public class AzureAiStudioEmbeddingsServiceSettings extends AzureAiStudioServiceSettings {
+
+ public static final String NAME = "azure_ai_studio_embeddings_service_settings";
+ static final String DIMENSIONS_SET_BY_USER = "dimensions_set_by_user";
+
+ public static AzureAiStudioEmbeddingsServiceSettings fromMap(Map map, ConfigurationParseContext context) {
+ ValidationException validationException = new ValidationException();
+
+ var settings = embeddingSettingsFromMap(map, validationException, context);
+
+ if (validationException.validationErrors().isEmpty() == false) {
+ throw validationException;
+ }
+
+ return new AzureAiStudioEmbeddingsServiceSettings(settings);
+ }
+
+ private static AzureAiStudioEmbeddingCommonFields embeddingSettingsFromMap(
+ Map map,
+ ValidationException validationException,
+ ConfigurationParseContext context
+ ) {
+ var baseSettings = AzureAiStudioServiceSettings.fromMap(map, validationException, context);
+ SimilarityMeasure similarity = extractSimilarity(map, ModelConfigurations.SERVICE_SETTINGS, validationException);
+ Integer dims = removeAsType(map, DIMENSIONS, Integer.class);
+ Integer maxTokens = removeAsType(map, MAX_INPUT_TOKENS, Integer.class);
+
+ Boolean dimensionsSetByUser = extractOptionalBoolean(map, DIMENSIONS_SET_BY_USER, validationException);
+
+ switch (context) {
+ case REQUEST -> {
+ if (dimensionsSetByUser != null) {
+ validationException.addValidationError(
+ ServiceUtils.invalidSettingError(DIMENSIONS_SET_BY_USER, ModelConfigurations.SERVICE_SETTINGS)
+ );
+ }
+ dimensionsSetByUser = dims != null;
+ }
+ case PERSISTENT -> {
+ if (dimensionsSetByUser == null) {
+ validationException.addValidationError(
+ ServiceUtils.missingSettingErrorMsg(DIMENSIONS_SET_BY_USER, ModelConfigurations.SERVICE_SETTINGS)
+ );
+ }
+ }
+ }
+ return new AzureAiStudioEmbeddingCommonFields(baseSettings, dims, dimensionsSetByUser, maxTokens, similarity);
+ }
+
+ private record AzureAiStudioEmbeddingCommonFields(
+ BaseAzureAiStudioCommonFields baseCommonFields,
+ @Nullable Integer dimensions,
+ Boolean dimensionsSetByUser,
+ @Nullable Integer maxInputTokens,
+ SimilarityMeasure similarity
+ ) {}
+
+ public AzureAiStudioEmbeddingsServiceSettings(
+ String target,
+ AzureAiStudioProvider provider,
+ AzureAiStudioEndpointType endpointType,
+ @Nullable Integer dimensions,
+ Boolean dimensionsSetByUser,
+ @Nullable Integer maxInputTokens,
+ @Nullable SimilarityMeasure similarity,
+ RateLimitSettings rateLimitSettings
+ ) {
+ super(target, provider, endpointType, rateLimitSettings);
+ this.dimensions = dimensions;
+ this.dimensionsSetByUser = dimensionsSetByUser;
+ this.maxInputTokens = maxInputTokens;
+ this.similarity = similarity;
+ }
+
+ public AzureAiStudioEmbeddingsServiceSettings(StreamInput in) throws IOException {
+ super(in);
+ this.dimensions = in.readOptionalVInt();
+ this.dimensionsSetByUser = in.readBoolean();
+ this.maxInputTokens = in.readOptionalVInt();
+ this.similarity = in.readOptionalEnum(SimilarityMeasure.class);
+ }
+
+ private AzureAiStudioEmbeddingsServiceSettings(AzureAiStudioEmbeddingCommonFields fields) {
+ this(
+ fields.baseCommonFields.target(),
+ fields.baseCommonFields.provider(),
+ fields.baseCommonFields.endpointType(),
+ fields.dimensions(),
+ fields.dimensionsSetByUser(),
+ fields.maxInputTokens(),
+ fields.similarity(),
+ fields.baseCommonFields.rateLimitSettings()
+ );
+ }
+
+ private final Integer dimensions;
+ private final Boolean dimensionsSetByUser;
+ private final Integer maxInputTokens;
+ private final SimilarityMeasure similarity;
+
+ @Override
+ public SimilarityMeasure similarity() {
+ return similarity;
+ }
+
+ public boolean dimensionsSetByUser() {
+ return this.dimensionsSetByUser;
+ }
+
+ public Integer dimensions() {
+ return dimensions;
+ }
+
+ public Integer maxInputTokens() {
+ return maxInputTokens;
+ }
+
+ @Override
+ public String getWriteableName() {
+ return NAME;
+ }
+
+ @Override
+ public TransportVersion getMinimalSupportedVersion() {
+ return TransportVersions.ML_INFERENCE_AZURE_AI_STUDIO;
+ }
+
+ @Override
+ public DenseVectorFieldMapper.ElementType elementType() {
+ return DenseVectorFieldMapper.ElementType.FLOAT;
+ }
+
+ @Override
+ public void writeTo(StreamOutput out) throws IOException {
+ super.writeTo(out);
+ out.writeOptionalVInt(dimensions);
+ out.writeBoolean(dimensionsSetByUser);
+ out.writeOptionalVInt(maxInputTokens);
+ out.writeOptionalEnum(similarity);
+ }
+
+ private void addXContentFragmentOfExposedFields(XContentBuilder builder, Params params) throws IOException {
+ if (dimensions != null) {
+ builder.field(DIMENSIONS, dimensions);
+ }
+ if (maxInputTokens != null) {
+ builder.field(MAX_INPUT_TOKENS, maxInputTokens);
+ }
+ if (similarity != null) {
+ builder.field(SIMILARITY, similarity);
+ }
+ }
+
+ @Override
+ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+ builder.startObject();
+
+ super.addXContentFields(builder, params);
+ addXContentFragmentOfExposedFields(builder, params);
+ builder.field(DIMENSIONS_SET_BY_USER, dimensionsSetByUser);
+
+ builder.endObject();
+ return builder;
+ }
+
+ @Override
+ protected XContentBuilder toXContentFragmentOfExposedFields(XContentBuilder builder, ToXContent.Params params) throws IOException {
+ super.addExposedXContentFields(builder, params);
+ addXContentFragmentOfExposedFields(builder, params);
+ return builder;
+ }
+
+ @Override
+ public boolean equals(Object o) {
+ if (this == o) return true;
+ if (o == null || getClass() != o.getClass()) return false;
+ AzureAiStudioEmbeddingsServiceSettings that = (AzureAiStudioEmbeddingsServiceSettings) o;
+
+ return Objects.equals(target, that.target)
+ && Objects.equals(provider, that.provider)
+ && Objects.equals(endpointType, that.endpointType)
+ && Objects.equals(dimensions, that.dimensions)
+ && Objects.equals(dimensionsSetByUser, that.dimensionsSetByUser)
+ && Objects.equals(maxInputTokens, that.maxInputTokens)
+ && Objects.equals(similarity, that.similarity)
+ && Objects.equals(rateLimitSettings, that.rateLimitSettings);
+ }
+
+ @Override
+ public int hashCode() {
+ return Objects.hash(target, provider, endpointType, dimensions, dimensionsSetByUser, maxInputTokens, similarity, rateLimitSettings);
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsTaskSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsTaskSettings.java
new file mode 100644
index 0000000000000..dc001993b366f
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/azureaistudio/embeddings/AzureAiStudioEmbeddingsTaskSettings.java
@@ -0,0 +1,109 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio.embeddings;
+
+import org.elasticsearch.TransportVersion;
+import org.elasticsearch.TransportVersions;
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.TaskSettings;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xpack.inference.services.azureopenai.embeddings.AzureOpenAiEmbeddingsTaskSettings;
+
+import java.io.IOException;
+import java.util.Map;
+import java.util.Objects;
+
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalString;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.USER_FIELD;
+
+public class AzureAiStudioEmbeddingsTaskSettings implements TaskSettings {
+ public static final String NAME = "azure_ai_studio_embeddings_task_settings";
+
+ public static AzureAiStudioEmbeddingsTaskSettings fromMap(Map map) {
+ ValidationException validationException = new ValidationException();
+
+ String user = extractOptionalString(map, USER_FIELD, ModelConfigurations.TASK_SETTINGS, validationException);
+ if (validationException.validationErrors().isEmpty() == false) {
+ throw validationException;
+ }
+
+ return new AzureAiStudioEmbeddingsTaskSettings(user);
+ }
+
+ /**
+ * Creates a new {@link AzureAiStudioEmbeddingsTaskSettings} object by overriding the values in originalSettings with the ones
+ * passed in via requestSettings if the fields are not null.
+ *
+ * @param originalSettings the original {@link AzureAiStudioEmbeddingsTaskSettings} from the inference entity configuration from storage
+ * @param requestSettings the {@link AzureAiStudioEmbeddingsRequestTaskSettings} from the request
+ * @return a new {@link AzureAiStudioEmbeddingsTaskSettings}
+ */
+ public static AzureAiStudioEmbeddingsTaskSettings of(
+ AzureAiStudioEmbeddingsTaskSettings originalSettings,
+ AzureAiStudioEmbeddingsRequestTaskSettings requestSettings
+ ) {
+ var userToUse = requestSettings.user() == null ? originalSettings.user : requestSettings.user();
+ return new AzureAiStudioEmbeddingsTaskSettings(userToUse);
+ }
+
+ public AzureAiStudioEmbeddingsTaskSettings(@Nullable String user) {
+ this.user = user;
+ }
+
+ public AzureAiStudioEmbeddingsTaskSettings(StreamInput in) throws IOException {
+ this.user = in.readOptionalString();
+ }
+
+ private final String user;
+
+ public String user() {
+ return this.user;
+ }
+
+ @Override
+ public String getWriteableName() {
+ return NAME;
+ }
+
+ @Override
+ public TransportVersion getMinimalSupportedVersion() {
+ return TransportVersions.ML_INFERENCE_AZURE_AI_STUDIO; // introduced with Azure AI Studio support; matches AzureAiStudioEmbeddingsServiceSettings
+ }
+
+ @Override
+ public void writeTo(StreamOutput out) throws IOException {
+ out.writeOptionalString(this.user);
+ }
+
+ @Override
+ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+ builder.startObject();
+ if (user != null) {
+ builder.field(USER_FIELD, user);
+ }
+ builder.endObject();
+ return builder;
+ }
+
+ @Override
+ public boolean equals(Object o) {
+ if (this == o) return true;
+ if (o == null || getClass() != o.getClass()) return false;
+ AzureAiStudioEmbeddingsTaskSettings that = (AzureAiStudioEmbeddingsTaskSettings) o;
+ return Objects.equals(user, that.user);
+ }
+
+ @Override
+ public int hashCode() {
+ return Objects.hashCode(user);
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/CohereService.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/CohereService.java
index deb1cfb901602..11dbf673ab7bd 100644
--- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/CohereService.java
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/CohereService.java
@@ -32,6 +32,7 @@
import org.elasticsearch.xpack.inference.services.SenderService;
import org.elasticsearch.xpack.inference.services.ServiceComponents;
import org.elasticsearch.xpack.inference.services.ServiceUtils;
+import org.elasticsearch.xpack.inference.services.cohere.completion.CohereCompletionModel;
import org.elasticsearch.xpack.inference.services.cohere.embeddings.CohereEmbeddingsModel;
import org.elasticsearch.xpack.inference.services.cohere.embeddings.CohereEmbeddingsServiceSettings;
import org.elasticsearch.xpack.inference.services.cohere.rerank.CohereRerankModel;
@@ -130,6 +131,7 @@ private static CohereModel createModel(
context
);
case RERANK -> new CohereRerankModel(inferenceEntityId, taskType, NAME, serviceSettings, taskSettings, secretSettings, context);
+ case COMPLETION -> new CohereCompletionModel(inferenceEntityId, taskType, NAME, serviceSettings, taskSettings, secretSettings);
default -> throw new ElasticsearchStatusException(failureMessage, RestStatus.BAD_REQUEST);
};
}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/completion/CohereCompletionModel.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/completion/CohereCompletionModel.java
new file mode 100644
index 0000000000000..761081d4d723c
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/completion/CohereCompletionModel.java
@@ -0,0 +1,86 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.cohere.completion;
+
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.EmptyTaskSettings;
+import org.elasticsearch.inference.InputType;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.ModelSecrets;
+import org.elasticsearch.inference.TaskSettings;
+import org.elasticsearch.inference.TaskType;
+import org.elasticsearch.xpack.inference.external.action.ExecutableAction;
+import org.elasticsearch.xpack.inference.external.action.cohere.CohereActionVisitor;
+import org.elasticsearch.xpack.inference.services.cohere.CohereModel;
+import org.elasticsearch.xpack.inference.services.settings.DefaultSecretSettings;
+
+import java.net.URI;
+import java.util.Map;
+
+public class CohereCompletionModel extends CohereModel {
+
+ public CohereCompletionModel(
+ String modelId,
+ TaskType taskType,
+ String service,
+ Map<String, Object> serviceSettings,
+ Map<String, Object> taskSettings,
+ @Nullable Map<String, Object> secrets
+ ) {
+ this(
+ modelId,
+ taskType,
+ service,
+ CohereCompletionServiceSettings.fromMap(serviceSettings),
+ EmptyTaskSettings.INSTANCE,
+ DefaultSecretSettings.fromMap(secrets)
+ );
+ }
+
+ // should only be used for testing
+ CohereCompletionModel(
+ String modelId,
+ TaskType taskType,
+ String service,
+ CohereCompletionServiceSettings serviceSettings,
+ TaskSettings taskSettings,
+ @Nullable DefaultSecretSettings secretSettings
+ ) {
+ super(
+ new ModelConfigurations(modelId, taskType, service, serviceSettings, taskSettings),
+ new ModelSecrets(secretSettings),
+ secretSettings,
+ serviceSettings
+ );
+ }
+
+ @Override
+ public CohereCompletionServiceSettings getServiceSettings() {
+ return (CohereCompletionServiceSettings) super.getServiceSettings();
+ }
+
+ @Override
+ public TaskSettings getTaskSettings() {
+ return super.getTaskSettings();
+ }
+
+ @Override
+ public DefaultSecretSettings getSecretSettings() {
+ return (DefaultSecretSettings) super.getSecretSettings();
+ }
+
+ @Override
+ public ExecutableAction accept(CohereActionVisitor visitor, Map<String, Object> taskSettings, InputType inputType) {
+ return visitor.create(this, taskSettings);
+ }
+
+ @Override
+ public URI uri() {
+ return getServiceSettings().uri();
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/completion/CohereCompletionServiceSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/completion/CohereCompletionServiceSettings.java
new file mode 100644
index 0000000000000..2a22f6333f1a2
--- /dev/null
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/cohere/completion/CohereCompletionServiceSettings.java
@@ -0,0 +1,148 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.cohere.completion;
+
+import org.elasticsearch.TransportVersion;
+import org.elasticsearch.TransportVersions;
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.ServiceSettings;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xpack.inference.services.cohere.CohereRateLimitServiceSettings;
+import org.elasticsearch.xpack.inference.services.settings.FilteredXContentObject;
+import org.elasticsearch.xpack.inference.services.settings.RateLimitSettings;
+
+import java.io.IOException;
+import java.net.URI;
+import java.util.Map;
+import java.util.Objects;
+
+import static org.elasticsearch.xpack.inference.services.ServiceFields.MODEL_ID;
+import static org.elasticsearch.xpack.inference.services.ServiceFields.URL;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.convertToUri;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.createOptionalUri;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalString;
+
+public class CohereCompletionServiceSettings extends FilteredXContentObject implements ServiceSettings, CohereRateLimitServiceSettings {
+
+ public static final String NAME = "cohere_completion_service_settings";
+
+ // Production key rate limits for all endpoints: https://docs.cohere.com/docs/going-live#production-key-specifications
+ // 10K requests per minute
+ private static final RateLimitSettings DEFAULT_RATE_LIMIT_SETTINGS = new RateLimitSettings(10_000);
+
+ public static CohereCompletionServiceSettings fromMap(Map<String, Object> map) {
+ ValidationException validationException = new ValidationException();
+
+ String url = extractOptionalString(map, URL, ModelConfigurations.SERVICE_SETTINGS, validationException);
+ URI uri = convertToUri(url, URL, ModelConfigurations.SERVICE_SETTINGS, validationException);
+ RateLimitSettings rateLimitSettings = RateLimitSettings.of(map, DEFAULT_RATE_LIMIT_SETTINGS, validationException);
+ String modelId = extractOptionalString(map, MODEL_ID, ModelConfigurations.SERVICE_SETTINGS, validationException);
+
+ if (validationException.validationErrors().isEmpty() == false) {
+ throw validationException;
+ }
+
+ return new CohereCompletionServiceSettings(uri, modelId, rateLimitSettings);
+ }
+
+ private final URI uri;
+
+ private final String modelId;
+
+ private final RateLimitSettings rateLimitSettings;
+
+ public CohereCompletionServiceSettings(@Nullable URI uri, @Nullable String modelId, @Nullable RateLimitSettings rateLimitSettings) {
+ this.uri = uri;
+ this.modelId = modelId;
+ this.rateLimitSettings = Objects.requireNonNullElse(rateLimitSettings, DEFAULT_RATE_LIMIT_SETTINGS);
+ }
+
+ public CohereCompletionServiceSettings(@Nullable String url, @Nullable String modelId, @Nullable RateLimitSettings rateLimitSettings) {
+ this(createOptionalUri(url), modelId, rateLimitSettings);
+ }
+
+ public CohereCompletionServiceSettings(StreamInput in) throws IOException {
+ uri = createOptionalUri(in.readOptionalString());
+ modelId = in.readOptionalString();
+ rateLimitSettings = new RateLimitSettings(in);
+ }
+
+ @Override
+ public RateLimitSettings rateLimitSettings() {
+ return rateLimitSettings;
+ }
+
+ public URI uri() {
+ return uri;
+ }
+
+ public String modelId() {
+ return modelId;
+ }
+
+ @Override
+ public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+ builder.startObject();
+
+ toXContentFragmentOfExposedFields(builder, params);
+ rateLimitSettings.toXContent(builder, params);
+
+ builder.endObject();
+ return builder;
+ }
+
+ @Override
+ public String getWriteableName() {
+ return NAME;
+ }
+
+ @Override
+ public TransportVersion getMinimalSupportedVersion() {
+ return TransportVersions.ML_INFERENCE_COHERE_COMPLETION_ADDED;
+ }
+
+ @Override
+ public void writeTo(StreamOutput out) throws IOException {
+ var uriToWrite = uri != null ? uri.toString() : null;
+ out.writeOptionalString(uriToWrite);
+ out.writeOptionalString(modelId);
+ rateLimitSettings.writeTo(out);
+ }
+
+ @Override
+ protected XContentBuilder toXContentFragmentOfExposedFields(XContentBuilder builder, Params params) throws IOException {
+ if (uri != null) {
+ builder.field(URL, uri.toString());
+ }
+
+ if (modelId != null) {
+ builder.field(MODEL_ID, modelId);
+ }
+
+ return builder;
+ }
+
+ @Override
+ public boolean equals(Object object) {
+ if (this == object) return true;
+ if (object == null || getClass() != object.getClass()) return false;
+ CohereCompletionServiceSettings that = (CohereCompletionServiceSettings) object;
+ return Objects.equals(uri, that.uri)
+ && Objects.equals(modelId, that.modelId)
+ && Objects.equals(rateLimitSettings, that.rateLimitSettings);
+ }
+
+ @Override
+ public int hashCode() {
+ return Objects.hash(uri, modelId, rateLimitSettings);
+ }
+}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/settings/InternalServiceSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/settings/InternalServiceSettings.java
index 854722d989340..ee7db662b4997 100644
--- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/settings/InternalServiceSettings.java
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/settings/InternalServiceSettings.java
@@ -41,7 +41,7 @@ protected static void validateParameters(Integer numAllocations, ValidationExcep
);
} else if (numAllocations < 1) {
validationException.addValidationError(
- ServiceUtils.mustBeAPositiveNumberErrorMessage(NUM_ALLOCATIONS, ModelConfigurations.SERVICE_SETTINGS, numAllocations)
+ ServiceUtils.mustBeAPositiveIntegerErrorMessage(NUM_ALLOCATIONS, ModelConfigurations.SERVICE_SETTINGS, numAllocations)
);
}
@@ -49,7 +49,7 @@ protected static void validateParameters(Integer numAllocations, ValidationExcep
validationException.addValidationError(ServiceUtils.missingSettingErrorMsg(NUM_THREADS, ModelConfigurations.SERVICE_SETTINGS));
} else if (numThreads < 1) {
validationException.addValidationError(
- ServiceUtils.mustBeAPositiveNumberErrorMessage(NUM_THREADS, ModelConfigurations.SERVICE_SETTINGS, numThreads)
+ ServiceUtils.mustBeAPositiveIntegerErrorMessage(NUM_THREADS, ModelConfigurations.SERVICE_SETTINGS, numThreads)
);
}
}
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/settings/RateLimitSettings.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/settings/RateLimitSettings.java
index 985168c7ccfd1..cfc375a525dd6 100644
--- a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/settings/RateLimitSettings.java
+++ b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/settings/RateLimitSettings.java
@@ -19,7 +19,7 @@
import java.util.Objects;
import java.util.concurrent.TimeUnit;
-import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalPositiveInteger;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalPositiveLong;
import static org.elasticsearch.xpack.inference.services.ServiceUtils.removeFromMapOrDefaultEmpty;
public class RateLimitSettings implements Writeable, ToXContentFragment {
@@ -32,7 +32,7 @@ public class RateLimitSettings implements Writeable, ToXContentFragment {
public static RateLimitSettings of(Map<String, Object> map, RateLimitSettings defaultValue, ValidationException validationException) {
Map<String, Object> settings = removeFromMapOrDefaultEmpty(map, FIELD_NAME);
- var requestsPerMinute = extractOptionalPositiveInteger(settings, REQUESTS_PER_MINUTE_FIELD, FIELD_NAME, validationException);
+ var requestsPerMinute = extractOptionalPositiveLong(settings, REQUESTS_PER_MINUTE_FIELD, FIELD_NAME, validationException);
return requestsPerMinute == null ? defaultValue : new RateLimitSettings(requestsPerMinute);
}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/azureaistudio/AzureAiStudioActionAndCreatorTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/azureaistudio/AzureAiStudioActionAndCreatorTests.java
new file mode 100644
index 0000000000000..15d082f455130
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/azureaistudio/AzureAiStudioActionAndCreatorTests.java
@@ -0,0 +1,229 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.action.azureaistudio;
+
+import org.apache.http.HttpHeaders;
+import org.elasticsearch.action.support.PlainActionFuture;
+import org.elasticsearch.common.settings.Settings;
+import org.elasticsearch.core.TimeValue;
+import org.elasticsearch.inference.InferenceServiceResults;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.test.http.MockRequest;
+import org.elasticsearch.test.http.MockResponse;
+import org.elasticsearch.test.http.MockWebServer;
+import org.elasticsearch.threadpool.ThreadPool;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.core.inference.action.InferenceAction;
+import org.elasticsearch.xpack.inference.common.TruncatorTests;
+import org.elasticsearch.xpack.inference.external.action.openai.OpenAiChatCompletionActionTests;
+import org.elasticsearch.xpack.inference.external.http.HttpClientManager;
+import org.elasticsearch.xpack.inference.external.http.sender.DocumentsOnlyInput;
+import org.elasticsearch.xpack.inference.external.http.sender.HttpRequestSender;
+import org.elasticsearch.xpack.inference.external.http.sender.HttpRequestSenderTests;
+import org.elasticsearch.xpack.inference.logging.ThrottlerManager;
+import org.elasticsearch.xpack.inference.services.ServiceComponents;
+import org.elasticsearch.xpack.inference.services.ServiceComponentsTests;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProvider;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionModelTests;
+import org.elasticsearch.xpack.inference.services.azureaistudio.embeddings.AzureAiStudioEmbeddingsModelTests;
+import org.junit.After;
+import org.junit.Before;
+
+import java.io.IOException;
+import java.util.List;
+import java.util.Map;
+import java.util.concurrent.TimeUnit;
+
+import static org.elasticsearch.xpack.inference.Utils.inferenceUtilityPool;
+import static org.elasticsearch.xpack.inference.Utils.mockClusterServiceEmpty;
+import static org.elasticsearch.xpack.inference.external.http.Utils.entityAsMap;
+import static org.elasticsearch.xpack.inference.external.http.Utils.getUrl;
+import static org.elasticsearch.xpack.inference.external.http.retry.RetrySettingsTests.buildSettingsWithRetryFields;
+import static org.elasticsearch.xpack.inference.external.request.azureaistudio.AzureAiStudioRequestFields.API_KEY_HEADER;
+import static org.elasticsearch.xpack.inference.results.TextEmbeddingResultsTests.buildExpectation;
+import static org.hamcrest.Matchers.equalTo;
+import static org.hamcrest.Matchers.hasSize;
+import static org.hamcrest.Matchers.is;
+import static org.mockito.Mockito.mock;
+
+public class AzureAiStudioActionAndCreatorTests extends ESTestCase {
+ private static final TimeValue TIMEOUT = new TimeValue(30, TimeUnit.SECONDS);
+ private final MockWebServer webServer = new MockWebServer();
+ private ThreadPool threadPool;
+ private HttpClientManager clientManager;
+
+ @Before
+ public void init() throws Exception {
+ webServer.start();
+ threadPool = createThreadPool(inferenceUtilityPool());
+ clientManager = HttpClientManager.create(Settings.EMPTY, threadPool, mockClusterServiceEmpty(), mock(ThrottlerManager.class));
+ }
+
+ @After
+ public void shutdown() throws IOException {
+ clientManager.close();
+ terminate(threadPool);
+ webServer.close();
+ }
+
+ public void testEmbeddingsRequestAction() throws IOException {
+ var senderFactory = new HttpRequestSender.Factory(
+ ServiceComponentsTests.createWithEmptySettings(threadPool),
+ clientManager,
+ mockClusterServiceEmpty()
+ );
+
+ var timeoutSettings = buildSettingsWithRetryFields(
+ TimeValue.timeValueMillis(1),
+ TimeValue.timeValueMinutes(1),
+ TimeValue.timeValueSeconds(0)
+ );
+
+ var serviceComponents = new ServiceComponents(
+ threadPool,
+ mock(ThrottlerManager.class),
+ timeoutSettings,
+ TruncatorTests.createTruncator()
+ );
+
+ try (var sender = senderFactory.createSender("test_service")) {
+ sender.start();
+
+ webServer.enqueue(new MockResponse().setResponseCode(200).setBody(testEmbeddingsTokenResponseJson));
+
+ var model = AzureAiStudioEmbeddingsModelTests.createModel(
+ "id",
+ "http://will-be-replaced.local",
+ AzureAiStudioProvider.OPENAI,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey"
+ );
+ model.setURI(getUrl(webServer));
+
+ var creator = new AzureAiStudioActionCreator(sender, serviceComponents);
+ var action = creator.create(model, Map.of());
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var result = listener.actionGet(TIMEOUT);
+
+ assertThat(result.asMap(), is(buildExpectation(List.of(List.of(0.0123F, -0.0123F)))));
+ assertThat(webServer.requests(), hasSize(1));
+ assertNull(webServer.requests().get(0).getUri().getQuery());
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.CONTENT_TYPE), equalTo(XContentType.JSON.mediaType()));
+ assertThat(webServer.requests().get(0).getHeader(API_KEY_HEADER), equalTo("apikey"));
+
+ var requestMap = entityAsMap(webServer.requests().get(0).getBody());
+ assertThat(requestMap.size(), is(1));
+ assertThat(requestMap.get("input"), is(List.of("abc")));
+ }
+ }
+
+ public void testChatCompletionRequestAction() throws IOException {
+ var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+ var timeoutSettings = buildSettingsWithRetryFields(
+ TimeValue.timeValueMillis(1),
+ TimeValue.timeValueMinutes(1),
+ TimeValue.timeValueSeconds(0)
+ );
+
+ var serviceComponents = new ServiceComponents(
+ threadPool,
+ mock(ThrottlerManager.class),
+ timeoutSettings,
+ TruncatorTests.createTruncator()
+ );
+
+ try (var sender = senderFactory.createSender("test_service")) {
+ sender.start();
+
+ webServer.enqueue(new MockResponse().setResponseCode(200).setBody(testCompletionTokenResponseJson));
+ var webserverUrl = getUrl(webServer);
+ var model = AzureAiStudioChatCompletionModelTests.createModel(
+ "id",
+ "http://will-be-replaced.local",
+ AzureAiStudioProvider.COHERE,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey"
+ );
+ model.setURI(webserverUrl);
+
+ var creator = new AzureAiStudioActionCreator(sender, serviceComponents);
+ var action = creator.create(model, Map.of());
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var result = listener.actionGet(TIMEOUT);
+
+ assertThat(
+ result.asMap(),
+ is(OpenAiChatCompletionActionTests.buildExpectedChatCompletionResultMap(List.of("test input string")))
+ );
+ assertThat(webServer.requests(), hasSize(1));
+
+ MockRequest request = webServer.requests().get(0);
+
+ assertNull(request.getUri().getQuery());
+ assertThat(request.getHeader(HttpHeaders.CONTENT_TYPE), equalTo(XContentType.JSON.mediaType()));
+ assertThat(request.getHeader(HttpHeaders.AUTHORIZATION), equalTo("apikey"));
+
+ var requestMap = entityAsMap(request.getBody());
+ assertThat(requestMap.size(), is(1));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abc"))));
+ }
+ }
+
+ private static String testEmbeddingsTokenResponseJson = """
+ {
+ "object": "list",
+ "data": [
+ {
+ "object": "embedding",
+ "index": 0,
+ "embedding": [
+ 0.0123,
+ -0.0123
+ ]
+ }
+ ],
+ "model": "text-embedding-ada-002-v2",
+ "usage": {
+ "prompt_tokens": 8,
+ "total_tokens": 8
+ }
+ }
+ """;
+
+ private static String testCompletionTokenResponseJson = """
+ {
+ "choices": [
+ {
+ "finish_reason": "stop",
+ "index": 0,
+ "message": {
+ "content": "test input string",
+ "role": "assistant",
+ "tool_calls": null
+ }
+ }
+ ],
+ "created": 1714006424,
+ "id": "f92b5b4d-0de3-4152-a3c6-5aae8a74555c",
+ "model": "",
+ "object": "chat.completion",
+ "usage": {
+ "completion_tokens": 35,
+ "prompt_tokens": 8,
+ "total_tokens": 43
+ }
+ }""";
+
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/cohere/CohereActionCreatorTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/cohere/CohereActionCreatorTests.java
index 73b627742ab03..8d63072b5d7aa 100644
--- a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/cohere/CohereActionCreatorTests.java
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/cohere/CohereActionCreatorTests.java
@@ -24,6 +24,7 @@
import org.elasticsearch.xpack.inference.external.http.sender.HttpRequestSenderTests;
import org.elasticsearch.xpack.inference.logging.ThrottlerManager;
import org.elasticsearch.xpack.inference.services.cohere.CohereTruncation;
+import org.elasticsearch.xpack.inference.services.cohere.completion.CohereCompletionModelTests;
import org.elasticsearch.xpack.inference.services.cohere.embeddings.CohereEmbeddingType;
import org.elasticsearch.xpack.inference.services.cohere.embeddings.CohereEmbeddingsModelTests;
import org.elasticsearch.xpack.inference.services.cohere.embeddings.CohereEmbeddingsTaskSettings;
@@ -39,6 +40,7 @@
import static org.elasticsearch.xpack.inference.Utils.inferenceUtilityPool;
import static org.elasticsearch.xpack.inference.Utils.mockClusterServiceEmpty;
+import static org.elasticsearch.xpack.inference.external.action.cohere.CohereCompletionActionTests.buildExpectedChatCompletionResultMap;
import static org.elasticsearch.xpack.inference.external.http.Utils.entityAsMap;
import static org.elasticsearch.xpack.inference.external.http.Utils.getUrl;
import static org.elasticsearch.xpack.inference.results.TextEmbeddingResultsTests.buildExpectation;
@@ -148,4 +150,124 @@ public void testCreate_CohereEmbeddingsModel() throws IOException {
);
}
}
+
+ public void testCreate_CohereCompletionModel_WithModelSpecified() throws IOException {
+ var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+ try (var sender = senderFactory.createSender("test_service")) {
+ sender.start();
+
+ String responseJson = """
+ {
+ "response_id": "some id",
+ "text": "result",
+ "generation_id": "some id",
+ "chat_history": [
+ {
+ "role": "USER",
+ "message": "input"
+ },
+ {
+ "role": "CHATBOT",
+ "message": "result"
+ }
+ ],
+ "finish_reason": "COMPLETE",
+ "meta": {
+ "api_version": {
+ "version": "1"
+ },
+ "billed_units": {
+ "input_tokens": 4,
+ "output_tokens": 191
+ },
+ "tokens": {
+ "input_tokens": 70,
+ "output_tokens": 191
+ }
+ }
+ }
+ """;
+
+ webServer.enqueue(new MockResponse().setResponseCode(200).setBody(responseJson));
+
+ var model = CohereCompletionModelTests.createModel(getUrl(webServer), "secret", "model");
+ var actionCreator = new CohereActionCreator(sender, createWithEmptySettings(threadPool));
+ var action = actionCreator.create(model, Map.of());
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var result = listener.actionGet(TIMEOUT);
+
+ assertThat(result.asMap(), is(buildExpectedChatCompletionResultMap(List.of("result"))));
+ assertThat(webServer.requests(), hasSize(1));
+ assertNull(webServer.requests().get(0).getUri().getQuery());
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.CONTENT_TYPE), is(XContentType.JSON.mediaType()));
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.AUTHORIZATION), is("Bearer secret"));
+
+ var requestMap = entityAsMap(webServer.requests().get(0).getBody());
+ assertThat(requestMap, is(Map.of("message", "abc", "model", "model")));
+ }
+ }
+
+ public void testCreate_CohereCompletionModel_WithoutModelSpecified() throws IOException {
+ var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+ try (var sender = senderFactory.createSender("test_service")) {
+ sender.start();
+
+ String responseJson = """
+ {
+ "response_id": "some id",
+ "text": "result",
+ "generation_id": "some id",
+ "chat_history": [
+ {
+ "role": "USER",
+ "message": "input"
+ },
+ {
+ "role": "CHATBOT",
+ "message": "result"
+ }
+ ],
+ "finish_reason": "COMPLETE",
+ "meta": {
+ "api_version": {
+ "version": "1"
+ },
+ "billed_units": {
+ "input_tokens": 4,
+ "output_tokens": 191
+ },
+ "tokens": {
+ "input_tokens": 70,
+ "output_tokens": 191
+ }
+ }
+ }
+ """;
+
+ webServer.enqueue(new MockResponse().setResponseCode(200).setBody(responseJson));
+
+ var model = CohereCompletionModelTests.createModel(getUrl(webServer), "secret", null);
+ var actionCreator = new CohereActionCreator(sender, createWithEmptySettings(threadPool));
+ var action = actionCreator.create(model, Map.of());
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var result = listener.actionGet(TIMEOUT);
+
+ assertThat(result.asMap(), is(buildExpectedChatCompletionResultMap(List.of("result"))));
+ assertThat(webServer.requests(), hasSize(1));
+ assertNull(webServer.requests().get(0).getUri().getQuery());
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.CONTENT_TYPE), is(XContentType.JSON.mediaType()));
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.AUTHORIZATION), is("Bearer secret"));
+
+ var requestMap = entityAsMap(webServer.requests().get(0).getBody());
+ assertThat(requestMap, is(Map.of("message", "abc")));
+ }
+ }
}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/cohere/CohereCompletionActionTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/cohere/CohereCompletionActionTests.java
new file mode 100644
index 0000000000000..195f2bab1d6b5
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/action/cohere/CohereCompletionActionTests.java
@@ -0,0 +1,353 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.action.cohere;
+
+import org.apache.http.HttpHeaders;
+import org.elasticsearch.ElasticsearchException;
+import org.elasticsearch.ElasticsearchStatusException;
+import org.elasticsearch.action.ActionListener;
+import org.elasticsearch.action.support.PlainActionFuture;
+import org.elasticsearch.common.settings.Settings;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.core.TimeValue;
+import org.elasticsearch.inference.InferenceServiceResults;
+import org.elasticsearch.rest.RestStatus;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.test.http.MockResponse;
+import org.elasticsearch.test.http.MockWebServer;
+import org.elasticsearch.threadpool.ThreadPool;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.core.inference.action.InferenceAction;
+import org.elasticsearch.xpack.core.inference.results.ChatCompletionResults;
+import org.elasticsearch.xpack.inference.external.http.HttpClientManager;
+import org.elasticsearch.xpack.inference.external.http.sender.DocumentsOnlyInput;
+import org.elasticsearch.xpack.inference.external.http.sender.HttpRequestSenderTests;
+import org.elasticsearch.xpack.inference.external.http.sender.Sender;
+import org.elasticsearch.xpack.inference.external.request.cohere.CohereUtils;
+import org.elasticsearch.xpack.inference.logging.ThrottlerManager;
+import org.elasticsearch.xpack.inference.services.cohere.completion.CohereCompletionModelTests;
+import org.junit.After;
+import org.junit.Before;
+
+import java.io.IOException;
+import java.util.List;
+import java.util.Map;
+import java.util.concurrent.TimeUnit;
+
+import static org.elasticsearch.core.Strings.format;
+import static org.elasticsearch.xpack.inference.Utils.inferenceUtilityPool;
+import static org.elasticsearch.xpack.inference.Utils.mockClusterServiceEmpty;
+import static org.elasticsearch.xpack.inference.external.http.Utils.entityAsMap;
+import static org.elasticsearch.xpack.inference.external.http.Utils.getUrl;
+import static org.hamcrest.Matchers.equalTo;
+import static org.hamcrest.Matchers.hasSize;
+import static org.hamcrest.Matchers.is;
+import static org.mockito.ArgumentMatchers.any;
+import static org.mockito.Mockito.doAnswer;
+import static org.mockito.Mockito.doThrow;
+import static org.mockito.Mockito.mock;
+
+public class CohereCompletionActionTests extends ESTestCase {
+
+ private static final TimeValue TIMEOUT = new TimeValue(30, TimeUnit.SECONDS);
+ private final MockWebServer webServer = new MockWebServer();
+ private ThreadPool threadPool;
+ private HttpClientManager clientManager;
+
+ @Before
+ public void init() throws Exception {
+ webServer.start();
+ threadPool = createThreadPool(inferenceUtilityPool());
+ clientManager = HttpClientManager.create(Settings.EMPTY, threadPool, mockClusterServiceEmpty(), mock(ThrottlerManager.class));
+ }
+
+ @After
+ public void shutdown() throws IOException {
+ clientManager.close();
+ terminate(threadPool);
+ webServer.close();
+ }
+
+ public void testExecute_ReturnsSuccessfulResponse_WithModelSpecified() throws IOException {
+ var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+ try (var sender = HttpRequestSenderTests.createSenderWithSingleRequestManager(senderFactory, "test_service")) {
+ sender.start();
+
+ String responseJson = """
+ {
+ "response_id": "some id",
+ "text": "result",
+ "generation_id": "some id",
+ "chat_history": [
+ {
+ "role": "USER",
+ "message": "input"
+ },
+ {
+ "role": "CHATBOT",
+ "message": "result"
+ }
+ ],
+ "finish_reason": "COMPLETE",
+ "meta": {
+ "api_version": {
+ "version": "1"
+ },
+ "billed_units": {
+ "input_tokens": 4,
+ "output_tokens": 191
+ },
+ "tokens": {
+ "input_tokens": 70,
+ "output_tokens": 191
+ }
+ }
+ }
+ """;
+ webServer.enqueue(new MockResponse().setResponseCode(200).setBody(responseJson));
+
+ var action = createAction(getUrl(webServer), "secret", "model", sender);
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var result = listener.actionGet(TIMEOUT);
+
+ assertThat(result.asMap(), is(buildExpectedChatCompletionResultMap(List.of("result"))));
+ assertThat(webServer.requests(), hasSize(1));
+ assertNull(webServer.requests().get(0).getUri().getQuery());
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.CONTENT_TYPE), equalTo(XContentType.JSON.mediaType()));
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.AUTHORIZATION), equalTo("Bearer secret"));
+ assertThat(
+ webServer.requests().get(0).getHeader(CohereUtils.REQUEST_SOURCE_HEADER),
+ equalTo(CohereUtils.ELASTIC_REQUEST_SOURCE)
+ );
+
+ var requestMap = entityAsMap(webServer.requests().get(0).getBody());
+ assertThat(requestMap, is(Map.of("message", "abc", "model", "model")));
+ }
+ }
+
+ public void testExecute_ReturnsSuccessfulResponse_WithoutModelSpecified() throws IOException {
+ var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+ try (var sender = HttpRequestSenderTests.createSenderWithSingleRequestManager(senderFactory, "test_service")) {
+ sender.start();
+
+ String responseJson = """
+ {
+ "response_id": "some id",
+ "text": "result",
+ "generation_id": "some id",
+ "chat_history": [
+ {
+ "role": "USER",
+ "message": "input"
+ },
+ {
+ "role": "CHATBOT",
+ "message": "result"
+ }
+ ],
+ "finish_reason": "COMPLETE",
+ "meta": {
+ "api_version": {
+ "version": "1"
+ },
+ "billed_units": {
+ "input_tokens": 4,
+ "output_tokens": 191
+ },
+ "tokens": {
+ "input_tokens": 70,
+ "output_tokens": 191
+ }
+ }
+ }
+ """;
+ webServer.enqueue(new MockResponse().setResponseCode(200).setBody(responseJson));
+
+ var action = createAction(getUrl(webServer), "secret", null, sender);
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var result = listener.actionGet(TIMEOUT);
+
+ assertThat(result.asMap(), is(buildExpectedChatCompletionResultMap(List.of("result"))));
+ assertThat(webServer.requests(), hasSize(1));
+ assertNull(webServer.requests().get(0).getUri().getQuery());
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.CONTENT_TYPE), equalTo(XContentType.JSON.mediaType()));
+ assertThat(webServer.requests().get(0).getHeader(HttpHeaders.AUTHORIZATION), equalTo("Bearer secret"));
+ assertThat(
+ webServer.requests().get(0).getHeader(CohereUtils.REQUEST_SOURCE_HEADER),
+ equalTo(CohereUtils.ELASTIC_REQUEST_SOURCE)
+ );
+
+ var requestMap = entityAsMap(webServer.requests().get(0).getBody());
+ assertThat(requestMap, is(Map.of("message", "abc")));
+ }
+ }
+
+ public void testExecute_ThrowsURISyntaxException_ForInvalidUrl() throws IOException {
+ try (var sender = mock(Sender.class)) {
+ var thrownException = expectThrows(IllegalArgumentException.class, () -> createAction("a^b", "api key", "model", sender));
+ assertThat(thrownException.getMessage(), is("unable to parse url [a^b]"));
+ }
+ }
+
+ public void testExecute_ThrowsElasticsearchException() {
+ var sender = mock(Sender.class);
+ doThrow(new ElasticsearchException("failed")).when(sender).send(any(), any(), any(), any());
+
+ var action = createAction(getUrl(webServer), "secret", "model", sender);
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var thrownException = expectThrows(ElasticsearchException.class, () -> listener.actionGet(TIMEOUT));
+
+ assertThat(thrownException.getMessage(), is("failed"));
+ }
+
+ public void testExecute_ThrowsElasticsearchException_WhenSenderOnFailureIsCalled() {
+ var sender = mock(Sender.class);
+
+ doAnswer(invocation -> {
+ @SuppressWarnings("unchecked")
+ ActionListener<InferenceServiceResults> listener = (ActionListener<InferenceServiceResults>) invocation.getArguments()[2];
+ listener.onFailure(new IllegalStateException("failed"));
+
+ return Void.TYPE;
+ }).when(sender).send(any(), any(), any(), any());
+
+ var action = createAction(getUrl(webServer), "secret", "model", sender);
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var thrownException = expectThrows(ElasticsearchException.class, () -> listener.actionGet(TIMEOUT));
+
+ assertThat(thrownException.getMessage(), is(format("Failed to send Cohere completion request to [%s]", getUrl(webServer))));
+ }
+
+ public void testExecute_ThrowsElasticsearchException_WhenSenderOnFailureIsCalled_WhenUrlIsNull() {
+ var sender = mock(Sender.class);
+
+ doAnswer(invocation -> {
+ @SuppressWarnings("unchecked")
+ ActionListener<InferenceServiceResults> listener = (ActionListener<InferenceServiceResults>) invocation.getArguments()[2];
+ listener.onFailure(new IllegalStateException("failed"));
+
+ return Void.TYPE;
+ }).when(sender).send(any(), any(), any(), any());
+
+ var action = createAction(null, "secret", "model", sender);
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var thrownException = expectThrows(ElasticsearchException.class, () -> listener.actionGet(TIMEOUT));
+
+ assertThat(thrownException.getMessage(), is("Failed to send Cohere completion request"));
+ }
+
+ public void testExecute_ThrowsException() {
+ var sender = mock(Sender.class);
+ doThrow(new IllegalArgumentException("failed")).when(sender).send(any(), any(), any(), any());
+
+ var action = createAction(getUrl(webServer), "secret", "model", sender);
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var thrownException = expectThrows(ElasticsearchException.class, () -> listener.actionGet(TIMEOUT));
+
+ assertThat(thrownException.getMessage(), is(format("Failed to send Cohere completion request to [%s]", getUrl(webServer))));
+ }
+
+ public void testExecute_ThrowsExceptionWithNullUrl() {
+ var sender = mock(Sender.class);
+ doThrow(new IllegalArgumentException("failed")).when(sender).send(any(), any(), any(), any());
+
+ var action = createAction(null, "secret", "model", sender);
+
+ PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var thrownException = expectThrows(ElasticsearchException.class, () -> listener.actionGet(TIMEOUT));
+
+ assertThat(thrownException.getMessage(), is("Failed to send Cohere completion request"));
+ }
+
+ public void testExecute_ThrowsException_WhenInputIsGreaterThanOne() throws IOException {
+ var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+ try (var sender = senderFactory.createSender("test_service")) {
+ sender.start();
+
+ String responseJson = """
+ {
+ "response_id": "some id",
+ "text": "result",
+ "generation_id": "some id",
+ "chat_history": [
+ {
+ "role": "USER",
+ "message": "input"
+ },
+ {
+ "role": "CHATBOT",
+ "message": "result"
+ }
+ ],
+ "finish_reason": "COMPLETE",
+ "meta": {
+ "api_version": {
+ "version": "1"
+ },
+ "billed_units": {
+ "input_tokens": 4,
+ "output_tokens": 191
+ },
+ "tokens": {
+ "input_tokens": 70,
+ "output_tokens": 191
+ }
+ }
+ }
+ """;
+
+ webServer.enqueue(new MockResponse().setResponseCode(200).setBody(responseJson));
+
+ var action = createAction(getUrl(webServer), "secret", "model", sender);
+
+ PlainActionFuture listener = new PlainActionFuture<>();
+ action.execute(new DocumentsOnlyInput(List.of("abc", "def")), InferenceAction.Request.DEFAULT_TIMEOUT, listener);
+
+ var thrownException = expectThrows(ElasticsearchStatusException.class, () -> listener.actionGet(TIMEOUT));
+
+ assertThat(thrownException.getMessage(), is("Cohere completion only accepts 1 input"));
+ assertThat(thrownException.status(), is(RestStatus.BAD_REQUEST));
+ }
+ }
+
+ public static Map<String, Object> buildExpectedChatCompletionResultMap(List<String> results) {
+ return Map.of(
+ ChatCompletionResults.COMPLETION,
+ results.stream().map(result -> Map.of(ChatCompletionResults.Result.RESULT, result)).toList()
+ );
+ }
+
+ private CohereCompletionAction createAction(String url, String apiKey, @Nullable String modelName, Sender sender) {
+ var model = CohereCompletionModelTests.createModel(url, apiKey, modelName);
+
+ return new CohereCompletionAction(sender, model, threadPool);
+ }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioChatCompletionRequestEntityTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioChatCompletionRequestEntityTests.java
new file mode 100644
index 0000000000000..3b086f4d3b900
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioChatCompletionRequestEntityTests.java
@@ -0,0 +1,227 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.request.azureaistudio;
+
+import org.elasticsearch.common.Strings;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xcontent.XContentFactory;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+
+import java.io.IOException;
+import java.util.List;
+
+import static org.hamcrest.CoreMatchers.is;
+
+public class AzureAiStudioChatCompletionRequestEntityTests extends ESTestCase {
+
+ public void testToXContent_WhenTokenEndpoint_NoParameters() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(List.of("abc"), AzureAiStudioEndpointType.TOKEN, null, null, null, null);
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedTokenEndpointRequest(List.of("abc"), null, null, null, null);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenTokenEndpoint_WithTemperatureParam() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(List.of("abc"), AzureAiStudioEndpointType.TOKEN, 1.0, null, null, null);
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedTokenEndpointRequest(List.of("abc"), 1.0, null, null, null);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenTokenEndpoint_WithTopPParam() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(List.of("abc"), AzureAiStudioEndpointType.TOKEN, null, 2.0, null, null);
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedTokenEndpointRequest(List.of("abc"), null, 2.0, null, null);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenTokenEndpoint_WithDoSampleParam() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(List.of("abc"), AzureAiStudioEndpointType.TOKEN, null, null, true, null);
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedTokenEndpointRequest(List.of("abc"), null, null, true, null);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenTokenEndpoint_WithMaxNewTokensParam() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(List.of("abc"), AzureAiStudioEndpointType.TOKEN, null, null, null, 512);
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedTokenEndpointRequest(List.of("abc"), null, null, null, 512);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenRealtimeEndpoint_NoParameters() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(
+ List.of("abc"),
+ AzureAiStudioEndpointType.REALTIME,
+ null,
+ null,
+ null,
+ null
+ );
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedRealtimeEndpointRequest(List.of("abc"), null, null, null, null);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenRealtimeEndpoint_WithTemperatureParam() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(
+ List.of("abc"),
+ AzureAiStudioEndpointType.REALTIME,
+ 1.0,
+ null,
+ null,
+ null
+ );
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedRealtimeEndpointRequest(List.of("abc"), 1.0, null, null, null);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenRealtimeEndpoint_WithTopPParam() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(
+ List.of("abc"),
+ AzureAiStudioEndpointType.REALTIME,
+ null,
+ 2.0,
+ null,
+ null
+ );
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedRealtimeEndpointRequest(List.of("abc"), null, 2.0, null, null);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenRealtimeEndpoint_WithDoSampleParam() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(
+ List.of("abc"),
+ AzureAiStudioEndpointType.REALTIME,
+ null,
+ null,
+ true,
+ null
+ );
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedRealtimeEndpointRequest(List.of("abc"), null, null, true, null);
+ assertThat(request, is(expectedRequest));
+ }
+
+ public void testToXContent_WhenRealtimeEndpoint_WithMaxNewTokensParam() throws IOException {
+ var entity = new AzureAiStudioChatCompletionRequestEntity(
+ List.of("abc"),
+ AzureAiStudioEndpointType.REALTIME,
+ null,
+ null,
+ null,
+ 512
+ );
+ var request = getXContentAsString(entity);
+ var expectedRequest = getExpectedRealtimeEndpointRequest(List.of("abc"), null, null, null, 512);
+ assertThat(request, is(expectedRequest));
+ }
+
+ private String getXContentAsString(AzureAiStudioChatCompletionRequestEntity entity) throws IOException {
+ XContentBuilder builder = XContentFactory.contentBuilder(XContentType.JSON);
+ entity.toXContent(builder, null);
+ return Strings.toString(builder);
+ }
+
+ private String getExpectedTokenEndpointRequest(
+ List<String> inputs,
+ @Nullable Double temperature,
+ @Nullable Double topP,
+ @Nullable Boolean doSample,
+ @Nullable Integer maxNewTokens
+ ) {
+ String expected = "{";
+
+ expected = addMessageInputs("messages", expected, inputs);
+ expected = addParameters(expected, temperature, topP, doSample, maxNewTokens);
+
+ expected += "}";
+ return expected;
+ }
+
+ private String getExpectedRealtimeEndpointRequest(
+ List<String> inputs,
+ @Nullable Double temperature,
+ @Nullable Double topP,
+ @Nullable Boolean doSample,
+ @Nullable Integer maxNewTokens
+ ) {
+ String expected = "{\"input_data\":{";
+
+ expected = addMessageInputs("input_string", expected, inputs);
+ expected = addParameters(expected, temperature, topP, doSample, maxNewTokens);
+
+ expected += "}}";
+ return expected;
+ }
+
+ private String addMessageInputs(String fieldName, String expected, List<String> inputs) {
+ StringBuilder messages = new StringBuilder(Strings.format("\"%s\":[", fieldName));
+ var hasOne = false;
+ for (String input : inputs) {
+ if (hasOne) {
+ messages.append(",");
+ }
+ messages.append(getMessageString(input));
+ hasOne = true;
+ }
+ messages.append("]");
+
+ return expected + messages;
+ }
+
+ private String getMessageString(String input) {
+ return Strings.format("{\"content\":\"%s\",\"role\":\"user\"}", input);
+ }
+
+ private String addParameters(String expected, Double temperature, Double topP, Boolean doSample, Integer maxNewTokens) {
+ if (temperature == null && topP == null && doSample == null && maxNewTokens == null) {
+ return expected;
+ }
+
+ StringBuilder parameters = new StringBuilder(",\"parameters\":{");
+
+ var hasOne = false;
+ if (temperature != null) {
+ parameters.append(Strings.format("\"temperature\":%.1f", temperature));
+ hasOne = true;
+ }
+
+ if (topP != null) {
+ if (hasOne) {
+ parameters.append(",");
+ }
+ parameters.append(Strings.format("\"top_p\":%.1f", topP));
+ hasOne = true;
+ }
+
+ if (doSample != null) {
+ if (hasOne) {
+ parameters.append(",");
+ }
+ parameters.append(Strings.format("\"do_sample\":%s", doSample.equals(Boolean.TRUE)));
+ hasOne = true;
+ }
+
+ if (maxNewTokens != null) {
+ if (hasOne) {
+ parameters.append(",");
+ }
+ parameters.append(Strings.format("\"max_new_tokens\":%d", maxNewTokens));
+ }
+
+ parameters.append("}");
+
+ return expected + parameters;
+ }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioChatCompletionRequestTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioChatCompletionRequestTests.java
new file mode 100644
index 0000000000000..f3ddf7f9299d9
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioChatCompletionRequestTests.java
@@ -0,0 +1,465 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.request.azureaistudio;
+
+import org.apache.http.HttpHeaders;
+import org.apache.http.client.methods.HttpPost;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.inference.external.request.HttpRequest;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProvider;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionModelTests;
+
+import java.io.IOException;
+import java.util.HashMap;
+import java.util.List;
+import java.util.Map;
+
+import static org.elasticsearch.xpack.inference.external.http.Utils.entityAsMap;
+import static org.elasticsearch.xpack.inference.external.request.azureopenai.AzureOpenAiUtils.API_KEY_HEADER;
+import static org.hamcrest.Matchers.aMapWithSize;
+import static org.hamcrest.Matchers.instanceOf;
+import static org.hamcrest.Matchers.is;
+
+public class AzureAiStudioChatCompletionRequestTests extends ESTestCase {
+
+ public void testCreateRequest_WithOpenAiProviderTokenEndpoint_NoParams() throws IOException {
+ var request = createRequest(
+ "http://openaitarget.local",
+ AzureAiStudioProvider.OPENAI,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://openaitarget.local");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.OPENAI, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(1));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ }
+
+ public void testCreateRequest_WithOpenAiProviderTokenEndpoint_WithTemperatureParam() throws IOException {
+ var request = createRequest(
+ "http://openaitarget.local",
+ AzureAiStudioProvider.OPENAI,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ 1.0,
+ null,
+ null,
+ null,
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://openaitarget.local");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.OPENAI, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(2));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ assertThat(requestMap.get("parameters"), is(getParameterMap(1.0, null, null, null)));
+ }
+
+ public void testCreateRequest_WithOpenAiProviderTokenEndpoint_WithTopPParam() throws IOException {
+ var request = createRequest(
+ "http://openaitarget.local",
+ AzureAiStudioProvider.OPENAI,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ null,
+ 2.0,
+ null,
+ null,
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://openaitarget.local");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.OPENAI, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(2));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ assertThat(requestMap.get("parameters"), is(getParameterMap(null, 2.0, null, null)));
+ }
+
+ public void testCreateRequest_WithOpenAiProviderTokenEndpoint_WithDoSampleParam() throws IOException {
+ var request = createRequest(
+ "http://openaitarget.local",
+ AzureAiStudioProvider.OPENAI,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ null,
+ null,
+ true,
+ null,
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://openaitarget.local");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.OPENAI, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(2));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ assertThat(requestMap.get("parameters"), is(getParameterMap(null, null, true, null)));
+ }
+
+ public void testCreateRequest_WithOpenAiProviderTokenEndpoint_WithMaxNewTokensParam() throws IOException {
+ var request = createRequest(
+ "http://openaitarget.local",
+ AzureAiStudioProvider.OPENAI,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ null,
+ null,
+ null,
+ 512,
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://openaitarget.local");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.OPENAI, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(2));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ assertThat(requestMap.get("parameters"), is(getParameterMap(null, null, null, 512)));
+ }
+
+ public void testCreateRequest_WithCohereProviderTokenEndpoint_NoParams() throws IOException {
+ var request = createRequest(
+ "http://coheretarget.local",
+ AzureAiStudioProvider.COHERE,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://coheretarget.local/v1/chat/completions");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.COHERE, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(1));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ }
+
+ public void testCreateRequest_WithCohereProviderTokenEndpoint_WithTemperatureParam() throws IOException {
+ var request = createRequest(
+ "http://coheretarget.local",
+ AzureAiStudioProvider.COHERE,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ 1.0,
+ null,
+ null,
+ null,
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://coheretarget.local/v1/chat/completions");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.COHERE, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(2));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ assertThat(requestMap.get("parameters"), is(getParameterMap(1.0, null, null, null)));
+ }
+
+ public void testCreateRequest_WithCohereProviderTokenEndpoint_WithTopPParam() throws IOException {
+ var request = createRequest(
+ "http://coheretarget.local",
+ AzureAiStudioProvider.COHERE,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ null,
+ 2.0,
+ null,
+ null,
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://coheretarget.local/v1/chat/completions");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.COHERE, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(2));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ assertThat(requestMap.get("parameters"), is(getParameterMap(null, 2.0, null, null)));
+ }
+
+ public void testCreateRequest_WithCohereProviderTokenEndpoint_WithDoSampleParam() throws IOException {
+ var request = createRequest(
+ "http://coheretarget.local",
+ AzureAiStudioProvider.COHERE,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ null,
+ null,
+ true,
+ null,
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://coheretarget.local/v1/chat/completions");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.COHERE, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(2));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ assertThat(requestMap.get("parameters"), is(getParameterMap(null, null, true, null)));
+ }
+
+ public void testCreateRequest_WithCohereProviderTokenEndpoint_WithMaxNewTokensParam() throws IOException {
+ var request = createRequest(
+ "http://coheretarget.local",
+ AzureAiStudioProvider.COHERE,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey",
+ null,
+ null,
+ null,
+ 512,
+ "abcd"
+ );
+ var httpRequest = request.createHttpRequest();
+
+ var httpPost = validateRequestUrlAndContentType(httpRequest, "http://coheretarget.local/v1/chat/completions");
+ validateRequestApiKey(httpPost, AzureAiStudioProvider.COHERE, AzureAiStudioEndpointType.TOKEN, "apikey");
+
+ var requestMap = entityAsMap(httpPost.getEntity().getContent());
+ assertThat(requestMap, aMapWithSize(2));
+ assertThat(requestMap.get("messages"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+ assertThat(requestMap.get("parameters"), is(getParameterMap(null, null, null, 512)));
+ }
+
+    // Verifies a Mistral realtime request posts only input_data.input_string when
+    // no generation parameters are configured on the model.
+    public void testCreateRequest_WithMistralProviderRealtimeEndpoint_NoParams() throws IOException {
+        var request = createRequest(
+            "http://mistral.local/score",
+            AzureAiStudioProvider.MISTRAL,
+            AzureAiStudioEndpointType.REALTIME,
+            "apikey",
+            "abcd"
+        );
+        var httpRequest = request.createHttpRequest();
+
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://mistral.local/score");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.MISTRAL, AzureAiStudioEndpointType.REALTIME, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(1));
+
+        // Parameterized cast (camelCase local) instead of a raw Map; cast is still unchecked.
+        @SuppressWarnings("unchecked")
+        var inputData = (Map<String, Object>) requestMap.get("input_data");
+        assertThat(inputData, aMapWithSize(1));
+        assertThat(inputData.get("input_string"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+    }
+
+    // Verifies a Mistral realtime request serializes the temperature setting into
+    // input_data.parameters next to the input_string chat payload.
+    public void testCreateRequest_WithMistralProviderRealtimeEndpoint_WithTemperatureParam() throws IOException {
+        var request = createRequest(
+            "http://mistral.local/score",
+            AzureAiStudioProvider.MISTRAL,
+            AzureAiStudioEndpointType.REALTIME,
+            "apikey",
+            1.0,
+            null,
+            null,
+            null,
+            "abcd"
+        );
+        var httpRequest = request.createHttpRequest();
+
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://mistral.local/score");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.MISTRAL, AzureAiStudioEndpointType.REALTIME, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(1));
+
+        // Parameterized cast (camelCase local) instead of a raw Map; cast is still unchecked.
+        @SuppressWarnings("unchecked")
+        var inputData = (Map<String, Object>) requestMap.get("input_data");
+        assertThat(inputData, aMapWithSize(2));
+        assertThat(inputData.get("input_string"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+        assertThat(inputData.get("parameters"), is(getParameterMap(1.0, null, null, null)));
+    }
+
+    // Verifies a Mistral realtime request serializes the top_p setting into
+    // input_data.parameters next to the input_string chat payload.
+    public void testCreateRequest_WithMistralProviderRealtimeEndpoint_WithTopPParam() throws IOException {
+        var request = createRequest(
+            "http://mistral.local/score",
+            AzureAiStudioProvider.MISTRAL,
+            AzureAiStudioEndpointType.REALTIME,
+            "apikey",
+            null,
+            2.0,
+            null,
+            null,
+            "abcd"
+        );
+        var httpRequest = request.createHttpRequest();
+
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://mistral.local/score");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.MISTRAL, AzureAiStudioEndpointType.REALTIME, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(1));
+
+        // Parameterized cast (camelCase local) instead of a raw Map; cast is still unchecked.
+        @SuppressWarnings("unchecked")
+        var inputData = (Map<String, Object>) requestMap.get("input_data");
+        assertThat(inputData, aMapWithSize(2));
+        assertThat(inputData.get("input_string"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+        assertThat(inputData.get("parameters"), is(getParameterMap(null, 2.0, null, null)));
+    }
+
+    // Verifies a Mistral realtime request serializes the do_sample setting into
+    // input_data.parameters next to the input_string chat payload.
+    public void testCreateRequest_WithMistralProviderRealtimeEndpoint_WithDoSampleParam() throws IOException {
+        var request = createRequest(
+            "http://mistral.local/score",
+            AzureAiStudioProvider.MISTRAL,
+            AzureAiStudioEndpointType.REALTIME,
+            "apikey",
+            null,
+            null,
+            true,
+            null,
+            "abcd"
+        );
+        var httpRequest = request.createHttpRequest();
+
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://mistral.local/score");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.MISTRAL, AzureAiStudioEndpointType.REALTIME, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(1));
+
+        // Parameterized cast (camelCase local) instead of a raw Map; cast is still unchecked.
+        @SuppressWarnings("unchecked")
+        var inputData = (Map<String, Object>) requestMap.get("input_data");
+        assertThat(inputData, aMapWithSize(2));
+        assertThat(inputData.get("input_string"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+        assertThat(inputData.get("parameters"), is(getParameterMap(null, null, true, null)));
+    }
+
+    // Verifies a Mistral realtime request serializes the max_new_tokens setting into
+    // input_data.parameters next to the input_string chat payload.
+    public void testCreateRequest_WithMistralProviderRealtimeEndpoint_WithMaxNewTokensParam() throws IOException {
+        var request = createRequest(
+            "http://mistral.local/score",
+            AzureAiStudioProvider.MISTRAL,
+            AzureAiStudioEndpointType.REALTIME,
+            "apikey",
+            null,
+            null,
+            null,
+            512,
+            "abcd"
+        );
+        var httpRequest = request.createHttpRequest();
+
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://mistral.local/score");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.MISTRAL, AzureAiStudioEndpointType.REALTIME, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(1));
+
+        // Parameterized cast (camelCase local) instead of a raw Map; cast is still unchecked.
+        @SuppressWarnings("unchecked")
+        var inputData = (Map<String, Object>) requestMap.get("input_data");
+        assertThat(inputData, aMapWithSize(2));
+        assertThat(inputData.get("input_string"), is(List.of(Map.of("role", "user", "content", "abcd"))));
+        assertThat(inputData.get("parameters"), is(getParameterMap(null, null, null, 512)));
+    }
+
+    /**
+     * Asserts the request is a POST to {@code expectedUrl} with a JSON content type
+     * and returns it cast to {@link HttpPost} for further assertions.
+     */
+    private HttpPost validateRequestUrlAndContentType(HttpRequest request, String expectedUrl) throws IOException {
+        assertThat(request.httpRequestBase(), instanceOf(HttpPost.class));
+        var httpPost = (HttpPost) request.httpRequestBase();
+        assertThat(httpPost.getURI().toString(), is(expectedUrl));
+        assertThat(httpPost.getLastHeader(HttpHeaders.CONTENT_TYPE).getValue(), is(XContentType.JSON.mediaType()));
+        return httpPost;
+    }
+
+    /**
+     * Asserts the auth header matches the provider/endpoint combination:
+     * token + OpenAI uses the api-key header, other token providers send the raw
+     * key in Authorization, and realtime endpoints use a Bearer token.
+     */
+    private void validateRequestApiKey(
+        HttpPost httpPost,
+        AzureAiStudioProvider provider,
+        AzureAiStudioEndpointType endpointType,
+        String apiKey
+    ) {
+        if (endpointType == AzureAiStudioEndpointType.TOKEN) {
+            if (provider == AzureAiStudioProvider.OPENAI) {
+                assertThat(httpPost.getLastHeader(API_KEY_HEADER).getValue(), is(apiKey));
+            } else {
+                assertThat(httpPost.getLastHeader(HttpHeaders.AUTHORIZATION).getValue(), is(apiKey));
+            }
+        } else {
+            assertThat(httpPost.getLastHeader(HttpHeaders.AUTHORIZATION).getValue(), is("Bearer " + apiKey));
+        }
+    }
+
+    /**
+     * Builds the expected "parameters" object for a request body, including only
+     * the generation settings that are non-null. Parameterized as
+     * {@code Map<String, Object>} instead of a raw Map.
+     */
+    private Map<String, Object> getParameterMap(
+        @Nullable Double temperature,
+        @Nullable Double topP,
+        @Nullable Boolean doSample,
+        @Nullable Integer maxNewTokens
+    ) {
+        var map = new HashMap<String, Object>();
+        if (temperature != null) {
+            map.put("temperature", temperature);
+        }
+        if (topP != null) {
+            map.put("top_p", topP);
+        }
+        if (doSample != null) {
+            map.put("do_sample", doSample);
+        }
+        if (maxNewTokens != null) {
+            map.put("max_new_tokens", maxNewTokens);
+        }
+        return map;
+    }
+
+    // Convenience overload: builds a chat completion request with no generation
+    // parameters (temperature/top_p/do_sample/max_new_tokens all null).
+    public static AzureAiStudioChatCompletionRequest createRequest(
+        String target,
+        AzureAiStudioProvider provider,
+        AzureAiStudioEndpointType endpointType,
+        String apiKey,
+        String input
+    ) {
+        return createRequest(target, provider, endpointType, apiKey, null, null, null, null, input);
+    }
+
+    // Builds a chat completion request against a model configured with the given
+    // target/provider/endpoint and optional generation parameters.
+    public static AzureAiStudioChatCompletionRequest createRequest(
+        String target,
+        AzureAiStudioProvider provider,
+        AzureAiStudioEndpointType endpointType,
+        String apiKey,
+        @Nullable Double temperature,
+        @Nullable Double topP,
+        @Nullable Boolean doSample,
+        @Nullable Integer maxNewTokens,
+        String input
+    ) {
+        var model = AzureAiStudioChatCompletionModelTests.createModel(
+            "id",
+            target,
+            provider,
+            endpointType,
+            apiKey,
+            temperature,
+            topP,
+            doSample,
+            maxNewTokens,
+            null
+        );
+        return new AzureAiStudioChatCompletionRequest(model, List.of(input));
+    }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioEmbeddingsRequestEntityTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioEmbeddingsRequestEntityTests.java
new file mode 100644
index 0000000000000..b2df7f7c27564
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioEmbeddingsRequestEntityTests.java
@@ -0,0 +1,77 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.request.azureaistudio;
+
+import org.elasticsearch.common.Strings;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xcontent.XContentFactory;
+import org.elasticsearch.xcontent.XContentType;
+
+import java.io.IOException;
+import java.util.List;
+
+import static org.hamcrest.CoreMatchers.is;
+
+/**
+ * Tests XContent serialization of {@code AzureAiStudioEmbeddingsRequestEntity}:
+ * the optional "user" field is written only when non-null, and "dimensions" is
+ * written only when non-null AND explicitly set by the user.
+ */
+public class AzureAiStudioEmbeddingsRequestEntityTests extends ESTestCase {
+    public void testXContent_WritesUserWhenDefined() throws IOException {
+        var entity = new AzureAiStudioEmbeddingsRequestEntity(List.of("abc"), "testuser", null, false);
+
+        XContentBuilder builder = XContentFactory.contentBuilder(XContentType.JSON);
+        entity.toXContent(builder, null);
+        String xContentResult = Strings.toString(builder);
+
+        assertThat(xContentResult, is("""
+            {"input":["abc"],"user":"testuser"}"""));
+    }
+
+    public void testXContent_DoesNotWriteUserWhenItIsNull() throws IOException {
+        var entity = new AzureAiStudioEmbeddingsRequestEntity(List.of("abc"), null, null, false);
+
+        XContentBuilder builder = XContentFactory.contentBuilder(XContentType.JSON);
+        entity.toXContent(builder, null);
+        String xContentResult = Strings.toString(builder);
+
+        assertThat(xContentResult, is("""
+            {"input":["abc"]}"""));
+    }
+
+    // dimensions=100 but dimensionsSetByUser=false -> field omitted
+    public void testXContent_DoesNotWriteDimensionsWhenNotSetByUser() throws IOException {
+        var entity = new AzureAiStudioEmbeddingsRequestEntity(List.of("abc"), null, 100, false);
+
+        XContentBuilder builder = XContentFactory.contentBuilder(XContentType.JSON);
+        entity.toXContent(builder, null);
+        String xContentResult = Strings.toString(builder);
+
+        assertThat(xContentResult, is("""
+            {"input":["abc"]}"""));
+    }
+
+    public void testXContent_DoesNotWriteDimensionsWhenNull_EvenIfSetByUserIsTrue() throws IOException {
+        var entity = new AzureAiStudioEmbeddingsRequestEntity(List.of("abc"), null, null, true);
+
+        XContentBuilder builder = XContentFactory.contentBuilder(XContentType.JSON);
+        entity.toXContent(builder, null);
+        String xContentResult = Strings.toString(builder);
+
+        assertThat(xContentResult, is("""
+            {"input":["abc"]}"""));
+    }
+
+    public void testXContent_WritesDimensionsWhenNonNull_AndSetByUserIsTrue() throws IOException {
+        var entity = new AzureAiStudioEmbeddingsRequestEntity(List.of("abc"), null, 100, true);
+
+        XContentBuilder builder = XContentFactory.contentBuilder(XContentType.JSON);
+        entity.toXContent(builder, null);
+        String xContentResult = Strings.toString(builder);
+
+        assertThat(xContentResult, is("""
+            {"input":["abc"],"dimensions":100}"""));
+    }
+
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioEmbeddingsRequestTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioEmbeddingsRequestTests.java
new file mode 100644
index 0000000000000..524d813a4da1f
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/azureaistudio/AzureAiStudioEmbeddingsRequestTests.java
@@ -0,0 +1,185 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.request.azureaistudio;
+
+import org.apache.http.HttpHeaders;
+import org.apache.http.client.methods.HttpPost;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.inference.common.Truncator;
+import org.elasticsearch.xpack.inference.common.TruncatorTests;
+import org.elasticsearch.xpack.inference.external.request.HttpRequest;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProvider;
+import org.elasticsearch.xpack.inference.services.azureaistudio.embeddings.AzureAiStudioEmbeddingsModelTests;
+
+import java.io.IOException;
+import java.util.List;
+
+import static org.elasticsearch.xpack.inference.external.http.Utils.entityAsMap;
+import static org.elasticsearch.xpack.inference.external.request.azureopenai.AzureOpenAiUtils.API_KEY_HEADER;
+import static org.hamcrest.Matchers.aMapWithSize;
+import static org.hamcrest.Matchers.instanceOf;
+import static org.hamcrest.Matchers.is;
+
+/**
+ * Tests HTTP request construction for {@code AzureAiStudioEmbeddingsRequest}:
+ * URL routing per provider (OpenAI targets the raw URL, Cohere appends
+ * /v1/embeddings), auth headers, body serialization, and truncation behavior.
+ */
+public class AzureAiStudioEmbeddingsRequestTests extends ESTestCase {
+
+    public void testCreateRequest_WithOpenAiProvider_NoAdditionalParams() throws IOException {
+        var request = createRequest(
+            "http://openaitarget.local",
+            AzureAiStudioProvider.OPENAI,
+            AzureAiStudioEndpointType.TOKEN,
+            "apikey",
+            "abcd",
+            null
+        );
+        var httpRequest = request.createHttpRequest();
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://openaitarget.local");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.OPENAI, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(1));
+        assertThat(requestMap.get("input"), is(List.of("abcd")));
+    }
+
+    public void testCreateRequest_WithOpenAiProvider_WithUserParam() throws IOException {
+        var request = createRequest(
+            "http://openaitarget.local",
+            AzureAiStudioProvider.OPENAI,
+            AzureAiStudioEndpointType.TOKEN,
+            "apikey",
+            "abcd",
+            "userid"
+        );
+        var httpRequest = request.createHttpRequest();
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://openaitarget.local");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.OPENAI, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(2));
+        assertThat(requestMap.get("input"), is(List.of("abcd")));
+        assertThat(requestMap.get("user"), is("userid"));
+    }
+
+    public void testCreateRequest_WithCohereProvider_NoAdditionalParams() throws IOException {
+        var request = createRequest(
+            "http://coheretarget.local",
+            AzureAiStudioProvider.COHERE,
+            AzureAiStudioEndpointType.TOKEN,
+            "apikey",
+            "abcd",
+            null
+        );
+        var httpRequest = request.createHttpRequest();
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://coheretarget.local/v1/embeddings");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.COHERE, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(1));
+        assertThat(requestMap.get("input"), is(List.of("abcd")));
+    }
+
+    public void testCreateRequest_WithCohereProvider_WithUserParam() throws IOException {
+        var request = createRequest(
+            "http://coheretarget.local",
+            AzureAiStudioProvider.COHERE,
+            AzureAiStudioEndpointType.TOKEN,
+            "apikey",
+            "abcd",
+            "userid"
+        );
+        var httpRequest = request.createHttpRequest();
+        var httpPost = validateRequestUrlAndContentType(httpRequest, "http://coheretarget.local/v1/embeddings");
+        validateRequestApiKey(httpPost, AzureAiStudioProvider.COHERE, "apikey");
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(2));
+        assertThat(requestMap.get("input"), is(List.of("abcd")));
+        assertThat(requestMap.get("user"), is("userid"));
+    }
+
+    // "abcd" (4 chars) truncates to "ab" — the truncator halves the input.
+    public void testTruncate_ReducesInputTextSizeByHalf() throws IOException {
+        var request = createRequest(
+            "http://openaitarget.local",
+            AzureAiStudioProvider.OPENAI,
+            AzureAiStudioEndpointType.TOKEN,
+            "apikey",
+            "abcd",
+            null
+        );
+        var truncatedRequest = request.truncate();
+
+        var httpRequest = truncatedRequest.createHttpRequest();
+        assertThat(httpRequest.httpRequestBase(), instanceOf(HttpPost.class));
+
+        var httpPost = (HttpPost) httpRequest.httpRequestBase();
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, aMapWithSize(1));
+        assertThat(requestMap.get("input"), is(List.of("ab")));
+    }
+
+    // Checks both states: flag is false before truncate() and true after.
+    public void testIsTruncated_ReturnsTrue() {
+        var request = createRequest(
+            "http://openaitarget.local",
+            AzureAiStudioProvider.OPENAI,
+            AzureAiStudioEndpointType.TOKEN,
+            "apikey",
+            "abcd",
+            null
+        );
+        assertFalse(request.getTruncationInfo()[0]);
+
+        var truncatedRequest = request.truncate();
+        assertTrue(truncatedRequest.getTruncationInfo()[0]);
+    }
+
+    // Asserts the request is a JSON POST to expectedUrl and returns the HttpPost.
+    private HttpPost validateRequestUrlAndContentType(HttpRequest request, String expectedUrl) throws IOException {
+        assertThat(request.httpRequestBase(), instanceOf(HttpPost.class));
+        var httpPost = (HttpPost) request.httpRequestBase();
+        assertThat(httpPost.getURI().toString(), is(expectedUrl));
+        assertThat(httpPost.getLastHeader(HttpHeaders.CONTENT_TYPE).getValue(), is(XContentType.JSON.mediaType()));
+        return httpPost;
+    }
+
+    // OpenAI sends the key via the api-key header; other providers via Authorization.
+    private void validateRequestApiKey(HttpPost httpPost, AzureAiStudioProvider provider, String apiKey) {
+        if (provider == AzureAiStudioProvider.OPENAI) {
+            assertThat(httpPost.getLastHeader(API_KEY_HEADER).getValue(), is(apiKey));
+        } else {
+            assertThat(httpPost.getLastHeader(HttpHeaders.AUTHORIZATION).getValue(), is(apiKey));
+        }
+    }
+
+    // Builds an embeddings request over a single non-truncated input string.
+    public static AzureAiStudioEmbeddingsRequest createRequest(
+        String target,
+        AzureAiStudioProvider provider,
+        AzureAiStudioEndpointType endpointType,
+        String apiKey,
+        String input,
+        @Nullable String user
+    ) {
+        var model = AzureAiStudioEmbeddingsModelTests.createModel(
+            "id",
+            target,
+            provider,
+            endpointType,
+            apiKey,
+            null,
+            false,
+            null,
+            null,
+            user,
+            null
+        );
+        return new AzureAiStudioEmbeddingsRequest(
+            TruncatorTests.createTruncator(),
+            new Truncator.TruncationResult(List.of(input), new boolean[] { false }),
+            model
+        );
+    }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereCompletionRequestEntityTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereCompletionRequestEntityTests.java
new file mode 100644
index 0000000000000..dbe6a9438d884
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereCompletionRequestEntityTests.java
@@ -0,0 +1,53 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.request.cohere;
+
+import org.elasticsearch.common.Strings;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xcontent.XContentBuilder;
+import org.elasticsearch.xcontent.XContentFactory;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.inference.external.request.cohere.completion.CohereCompletionRequestEntity;
+
+import java.io.IOException;
+import java.util.List;
+
+import static org.hamcrest.CoreMatchers.is;
+
+/**
+ * Tests XContent serialization of {@code CohereCompletionRequestEntity}: the
+ * first input is written as "message", "model" is optional, and null inputs
+ * are rejected at construction time.
+ */
+public class CohereCompletionRequestEntityTests extends ESTestCase {
+
+    public void testXContent_WritesAllFields() throws IOException {
+        var entity = new CohereCompletionRequestEntity(List.of("some input"), "model");
+
+        XContentBuilder builder = XContentFactory.contentBuilder(XContentType.JSON);
+        entity.toXContent(builder, null);
+        String xContentResult = Strings.toString(builder);
+
+        assertThat(xContentResult, is("""
+            {"message":"some input","model":"model"}"""));
+    }
+
+    public void testXContent_DoesNotWriteModelIfNotSpecified() throws IOException {
+        var entity = new CohereCompletionRequestEntity(List.of("some input"), null);
+
+        XContentBuilder builder = XContentFactory.contentBuilder(XContentType.JSON);
+        entity.toXContent(builder, null);
+        String xContentResult = Strings.toString(builder);
+
+        assertThat(xContentResult, is("""
+            {"message":"some input"}"""));
+    }
+
+    public void testXContent_ThrowsIfInputIsNull() {
+        expectThrows(NullPointerException.class, () -> new CohereCompletionRequestEntity(null, null));
+    }
+
+    public void testXContent_ThrowsIfMessageInInputIsNull() {
+        expectThrows(NullPointerException.class, () -> new CohereCompletionRequestEntity(List.of((String) null), null));
+    }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereCompletionRequestTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereCompletionRequestTests.java
new file mode 100644
index 0000000000000..d6d0d5c00eaf4
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereCompletionRequestTests.java
@@ -0,0 +1,74 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.request.cohere;
+
+import org.apache.http.HttpHeaders;
+import org.apache.http.client.methods.HttpPost;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.inference.external.request.cohere.completion.CohereCompletionRequest;
+import org.elasticsearch.xpack.inference.services.cohere.completion.CohereCompletionModelTests;
+
+import java.io.IOException;
+import java.util.List;
+import java.util.Map;
+
+import static org.elasticsearch.xpack.inference.external.http.Utils.entityAsMap;
+import static org.hamcrest.Matchers.instanceOf;
+import static org.hamcrest.Matchers.is;
+import static org.hamcrest.Matchers.sameInstance;
+
+/**
+ * Tests HTTP request construction for {@code CohereCompletionRequest}: headers
+ * (JSON content type, Bearer auth, Elastic request-source), body contents with
+ * and without a model id, and the no-op truncation contract.
+ */
+public class CohereCompletionRequestTests extends ESTestCase {
+
+    public void testCreateRequest_UrlDefined() throws IOException {
+        var request = new CohereCompletionRequest(List.of("abc"), CohereCompletionModelTests.createModel("url", "secret", null));
+
+        var httpRequest = request.createHttpRequest();
+        assertThat(httpRequest.httpRequestBase(), instanceOf(HttpPost.class));
+
+        var httpPost = (HttpPost) httpRequest.httpRequestBase();
+
+        assertThat(httpPost.getURI().toString(), is("url"));
+        assertThat(httpPost.getLastHeader(HttpHeaders.CONTENT_TYPE).getValue(), is(XContentType.JSON.mediaType()));
+        assertThat(httpPost.getLastHeader(HttpHeaders.AUTHORIZATION).getValue(), is("Bearer secret"));
+        assertThat(httpPost.getLastHeader(CohereUtils.REQUEST_SOURCE_HEADER).getValue(), is(CohereUtils.ELASTIC_REQUEST_SOURCE));
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, is(Map.of("message", "abc")));
+    }
+
+    public void testCreateRequest_ModelDefined() throws IOException {
+        var request = new CohereCompletionRequest(List.of("abc"), CohereCompletionModelTests.createModel("url", "secret", "model"));
+
+        var httpRequest = request.createHttpRequest();
+        assertThat(httpRequest.httpRequestBase(), instanceOf(HttpPost.class));
+
+        var httpPost = (HttpPost) httpRequest.httpRequestBase();
+
+        assertThat(httpPost.getURI().toString(), is("url"));
+        assertThat(httpPost.getLastHeader(HttpHeaders.CONTENT_TYPE).getValue(), is(XContentType.JSON.mediaType()));
+        assertThat(httpPost.getLastHeader(HttpHeaders.AUTHORIZATION).getValue(), is("Bearer secret"));
+        assertThat(httpPost.getLastHeader(CohereUtils.REQUEST_SOURCE_HEADER).getValue(), is(CohereUtils.ELASTIC_REQUEST_SOURCE));
+
+        var requestMap = entityAsMap(httpPost.getEntity().getContent());
+        assertThat(requestMap, is(Map.of("message", "abc", "model", "model")));
+    }
+
+    // Completion requests are never truncated: truncate() is an identity operation.
+    public void testTruncate_ReturnsSameInstance() {
+        var request = new CohereCompletionRequest(List.of("abc"), CohereCompletionModelTests.createModel("url", "secret", "model"));
+        var truncatedRequest = request.truncate();
+
+        assertThat(truncatedRequest, sameInstance(request));
+    }
+
+    public void testTruncationInfo_ReturnsNull() {
+        var request = new CohereCompletionRequest(List.of("abc"), CohereCompletionModelTests.createModel("url", "secret", "model"));
+
+        assertNull(request.getTruncationInfo());
+    }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereRequestTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereRequestTests.java
new file mode 100644
index 0000000000000..444fee7cac3c7
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/request/cohere/CohereRequestTests.java
@@ -0,0 +1,36 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.request.cohere;
+
+import org.apache.http.HttpHeaders;
+import org.apache.http.client.methods.HttpPost;
+import org.elasticsearch.common.settings.SecureString;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.inference.external.cohere.CohereAccount;
+
+import java.net.URI;
+
+import static org.hamcrest.Matchers.is;
+
+/**
+ * Tests that {@code CohereRequest.decorateWithAuthHeader} adds the JSON content
+ * type, a Bearer Authorization header built from the account's API key, and the
+ * Elastic request-source header.
+ */
+public class CohereRequestTests extends ESTestCase {
+
+    public void testDecorateWithAuthHeader() {
+        var request = new HttpPost("http://www.abc.com");
+
+        CohereRequest.decorateWithAuthHeader(
+            request,
+            new CohereAccount(URI.create("http://www.abc.com"), new SecureString(new char[] { 'a', 'b', 'c' }))
+        );
+
+        assertThat(request.getFirstHeader(HttpHeaders.CONTENT_TYPE).getValue(), is(XContentType.JSON.mediaType()));
+        assertThat(request.getFirstHeader(HttpHeaders.AUTHORIZATION).getValue(), is("Bearer abc"));
+        assertThat(request.getFirstHeader(CohereUtils.REQUEST_SOURCE_HEADER).getValue(), is(CohereUtils.ELASTIC_REQUEST_SOURCE));
+    }
+
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiErrorResponseEntityTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiErrorResponseEntityTests.java
new file mode 100644
index 0000000000000..fd133a26f5532
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiErrorResponseEntityTests.java
@@ -0,0 +1,48 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response;
+
+import org.apache.http.HttpResponse;
+import org.elasticsearch.common.Strings;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+
+import static org.hamcrest.Matchers.is;
+import static org.mockito.Mockito.mock;
+
+/**
+ * Tests {@code AzureAndOpenAiErrorResponseEntity.fromResponse}: it extracts
+ * error.message from a JSON error body and returns null when the body has no
+ * error object or is not parseable JSON.
+ */
+public class AzureAndOpenAiErrorResponseEntityTests extends ESTestCase {
+
+    // Wraps the raw JSON bytes in an HttpResult with a mocked HttpResponse.
+    private static HttpResult getMockResult(String jsonString) {
+        var response = mock(HttpResponse.class);
+        return new HttpResult(response, Strings.toUTF8Bytes(jsonString));
+    }
+
+    public void testErrorResponse_ExtractsError() {
+        var result = getMockResult("""
+            {"error":{"message":"test_error_message"}}""");
+
+        var error = AzureAndOpenAiErrorResponseEntity.fromResponse(result);
+        assertNotNull(error);
+        assertThat(error.getErrorMessage(), is("test_error_message"));
+    }
+
+    public void testErrorResponse_ReturnsNullIfNoError() {
+        var result = getMockResult("""
+            {"noerror":true}""");
+
+        var error = AzureAndOpenAiErrorResponseEntity.fromResponse(result);
+        assertNull(error);
+    }
+
+    public void testErrorResponse_ReturnsNullIfNotJson() {
+        var result = getMockResult("not a json string");
+
+        var error = AzureAndOpenAiErrorResponseEntity.fromResponse(result);
+        assertNull(error);
+    }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiExternalResponseHandlerTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiExternalResponseHandlerTests.java
new file mode 100644
index 0000000000000..4c9fb143c3a5c
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/AzureAndOpenAiExternalResponseHandlerTests.java
@@ -0,0 +1,245 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response;
+
+import org.apache.http.Header;
+import org.apache.http.HeaderElement;
+import org.apache.http.HttpResponse;
+import org.apache.http.StatusLine;
+import org.apache.http.message.BasicHeader;
+import org.elasticsearch.ElasticsearchStatusException;
+import org.elasticsearch.common.Strings;
+import org.elasticsearch.rest.RestStatus;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.http.retry.ContentTooLargeException;
+import org.elasticsearch.xpack.inference.external.http.retry.RetryException;
+import org.elasticsearch.xpack.inference.external.request.RequestTests;
+
+import java.nio.charset.StandardCharsets;
+
+import static org.hamcrest.Matchers.containsString;
+import static org.hamcrest.core.Is.is;
+import static org.mockito.ArgumentMatchers.anyString;
+import static org.mockito.Mockito.mock;
+import static org.mockito.Mockito.when;
+
+public class AzureAndOpenAiExternalResponseHandlerTests extends ESTestCase {
+
+ public void testCheckForFailureStatusCode() {
+ var statusLine = mock(StatusLine.class);
+
+ var httpResponse = mock(HttpResponse.class);
+ when(httpResponse.getStatusLine()).thenReturn(statusLine);
+ var header = mock(Header.class);
+ when(header.getElements()).thenReturn(new HeaderElement[] {});
+ when(httpResponse.getFirstHeader(anyString())).thenReturn(header);
+
+ var mockRequest = RequestTests.mockRequest("id");
+ var httpResult = new HttpResult(httpResponse, new byte[] {});
+ var handler = new AzureAndOpenAiExternalResponseHandler(
+ "",
+ (request, result) -> null,
+ AzureAndOpenAiErrorResponseEntity::fromResponse
+ );
+
+ // 200 ok
+ when(statusLine.getStatusCode()).thenReturn(200);
+ handler.checkForFailureStatusCode(mockRequest, httpResult);
+ // 503
+ when(statusLine.getStatusCode()).thenReturn(503);
+ var retryException = expectThrows(RetryException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertTrue(retryException.shouldRetry());
+ assertThat(
+ retryException.getCause().getMessage(),
+ containsString("Received a server busy error status code for request from inference entity id [id] status [503]")
+ );
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.BAD_REQUEST));
+ // 501
+ when(statusLine.getStatusCode()).thenReturn(501);
+ retryException = expectThrows(RetryException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertFalse(retryException.shouldRetry());
+ assertThat(
+ retryException.getCause().getMessage(),
+ containsString("Received a server error status code for request from inference entity id [id] status [501]")
+ );
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.BAD_REQUEST));
+ // 500
+ when(statusLine.getStatusCode()).thenReturn(500);
+ retryException = expectThrows(RetryException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertTrue(retryException.shouldRetry());
+ assertThat(
+ retryException.getCause().getMessage(),
+ containsString("Received a server error status code for request from inference entity id [id] status [500]")
+ );
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.BAD_REQUEST));
+ // 429
+ when(statusLine.getStatusCode()).thenReturn(429);
+ retryException = expectThrows(RetryException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertTrue(retryException.shouldRetry());
+ assertThat(retryException.getCause().getMessage(), containsString("Received a rate limit status code."));
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.TOO_MANY_REQUESTS));
+ // 413
+ when(statusLine.getStatusCode()).thenReturn(413);
+ retryException = expectThrows(ContentTooLargeException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertTrue(retryException.shouldRetry());
+ assertThat(retryException.getCause().getMessage(), containsString("Received a content too large status code"));
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.REQUEST_ENTITY_TOO_LARGE));
+ // 400 content too large
+ retryException = expectThrows(
+ ContentTooLargeException.class,
+ () -> handler.checkForFailureStatusCode(mockRequest, createContentTooLargeResult(400))
+ );
+ assertTrue(retryException.shouldRetry());
+ assertThat(retryException.getCause().getMessage(), containsString("Received a content too large status code"));
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.BAD_REQUEST));
+ // 400 generic bad request should not be marked as a content too large
+ when(statusLine.getStatusCode()).thenReturn(400);
+ retryException = expectThrows(RetryException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertFalse(retryException.shouldRetry());
+ assertThat(
+ retryException.getCause().getMessage(),
+ containsString("Received an unsuccessful status code for request from inference entity id [id] status [400]")
+ );
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.BAD_REQUEST));
+ // 400 is not flagged as a content too large when the error message is different
+ when(statusLine.getStatusCode()).thenReturn(400);
+ retryException = expectThrows(
+ RetryException.class,
+ () -> handler.checkForFailureStatusCode(mockRequest, createResult(400, "blah"))
+ );
+ assertFalse(retryException.shouldRetry());
+ assertThat(
+ retryException.getCause().getMessage(),
+ containsString("Received an unsuccessful status code for request from inference entity id [id] status [400]")
+ );
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.BAD_REQUEST));
+ // 401
+ when(statusLine.getStatusCode()).thenReturn(401);
+ retryException = expectThrows(RetryException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertFalse(retryException.shouldRetry());
+ assertThat(
+ retryException.getCause().getMessage(),
+ containsString("Received an authentication error status code for request from inference entity id [id] status [401]")
+ );
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.UNAUTHORIZED));
+ // 300
+ when(statusLine.getStatusCode()).thenReturn(300);
+ retryException = expectThrows(RetryException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertFalse(retryException.shouldRetry());
+ assertThat(
+ retryException.getCause().getMessage(),
+ containsString("Unhandled redirection for request from inference entity id [id] status [300]")
+ );
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.MULTIPLE_CHOICES));
+ // 402
+ when(statusLine.getStatusCode()).thenReturn(402);
+ retryException = expectThrows(RetryException.class, () -> handler.checkForFailureStatusCode(mockRequest, httpResult));
+ assertFalse(retryException.shouldRetry());
+ assertThat(
+ retryException.getCause().getMessage(),
+ containsString("Received an unsuccessful status code for request from inference entity id [id] status [402]")
+ );
+ assertThat(((ElasticsearchStatusException) retryException.getCause()).status(), is(RestStatus.PAYMENT_REQUIRED));
+ }
+
+ public void testBuildRateLimitErrorMessage() {
+ int statusCode = 429;
+ var statusLine = mock(StatusLine.class);
+ when(statusLine.getStatusCode()).thenReturn(statusCode);
+ var response = mock(HttpResponse.class);
+ when(response.getStatusLine()).thenReturn(statusLine);
+ var httpResult = new HttpResult(response, new byte[] {});
+
+ {
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REQUESTS_LIMIT)).thenReturn(
+ new BasicHeader(AzureAndOpenAiExternalResponseHandler.REQUESTS_LIMIT, "3000")
+ );
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_REQUESTS)).thenReturn(
+ new BasicHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_REQUESTS, "2999")
+ );
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.TOKENS_LIMIT)).thenReturn(
+ new BasicHeader(AzureAndOpenAiExternalResponseHandler.TOKENS_LIMIT, "10000")
+ );
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_TOKENS)).thenReturn(
+ new BasicHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_TOKENS, "99800")
+ );
+
+ var error = AzureAndOpenAiExternalResponseHandler.buildRateLimitErrorMessage(httpResult);
+ assertThat(
+ error,
+ containsString("Token limit [10000], remaining tokens [99800]. Request limit [3000], remaining requests [2999]")
+ );
+ }
+
+ {
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.TOKENS_LIMIT)).thenReturn(null);
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_TOKENS)).thenReturn(null);
+ var error = AzureAndOpenAiExternalResponseHandler.buildRateLimitErrorMessage(httpResult);
+ assertThat(
+ error,
+ containsString("Token limit [unknown], remaining tokens [unknown]. Request limit [3000], remaining requests [2999]")
+ );
+ }
+
+ {
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REQUESTS_LIMIT)).thenReturn(null);
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_REQUESTS)).thenReturn(
+ new BasicHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_REQUESTS, "2999")
+ );
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.TOKENS_LIMIT)).thenReturn(null);
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_TOKENS)).thenReturn(null);
+ var error = AzureAndOpenAiExternalResponseHandler.buildRateLimitErrorMessage(httpResult);
+ assertThat(error, containsString("Remaining tokens [unknown]. Remaining requests [2999]"));
+ }
+
+ {
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REQUESTS_LIMIT)).thenReturn(null);
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_REQUESTS)).thenReturn(
+ new BasicHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_REQUESTS, "2999")
+ );
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.TOKENS_LIMIT)).thenReturn(
+ new BasicHeader(AzureAndOpenAiExternalResponseHandler.TOKENS_LIMIT, "10000")
+ );
+ when(response.getFirstHeader(AzureAndOpenAiExternalResponseHandler.REMAINING_TOKENS)).thenReturn(null);
+ var error = AzureAndOpenAiExternalResponseHandler.buildRateLimitErrorMessage(httpResult);
+ assertThat(
+ error,
+ containsString("Token limit [10000], remaining tokens [unknown]. Request limit [unknown], remaining requests [2999]")
+ );
+ }
+ }
+
+ private static HttpResult createContentTooLargeResult(int statusCode) {
+ return createResult(
+ statusCode,
+ "This model's maximum context length is 8192 tokens, however you requested 13531 tokens (13531 in your prompt;"
+ + "0 for the completion). Please reduce your prompt; or completion length."
+ );
+ }
+
+ private static HttpResult createResult(int statusCode, String message) {
+ var statusLine = mock(StatusLine.class);
+ when(statusLine.getStatusCode()).thenReturn(statusCode);
+ var httpResponse = mock(HttpResponse.class);
+ when(httpResponse.getStatusLine()).thenReturn(statusLine);
+
+ String responseJson = Strings.format("""
+ {
+ "error": {
+ "message": "%s",
+ "type": "content_too_large",
+ "param": null,
+ "code": null
+ }
+ }
+ """, message);
+
+ return new HttpResult(httpResponse, responseJson.getBytes(StandardCharsets.UTF_8));
+ }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioChatCompletionResponseEntityTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioChatCompletionResponseEntityTests.java
new file mode 100644
index 0000000000000..7d5aafa181b19
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioChatCompletionResponseEntityTests.java
@@ -0,0 +1,96 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response.azureaistudio;
+
+import org.apache.http.HttpResponse;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xpack.core.inference.results.ChatCompletionResults;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.request.azureaistudio.AzureAiStudioChatCompletionRequest;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioEndpointType;
+import org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioProvider;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionModelTests;
+
+import java.io.IOException;
+import java.nio.charset.StandardCharsets;
+import java.util.List;
+
+import static org.hamcrest.Matchers.equalTo;
+import static org.hamcrest.Matchers.is;
+import static org.mockito.Mockito.mock;
+
+public class AzureAiStudioChatCompletionResponseEntityTests extends ESTestCase {
+
+ public void testCompletionResponse_FromTokenEndpoint() throws IOException {
+ var entity = new AzureAiStudioChatCompletionResponseEntity();
+ var model = AzureAiStudioChatCompletionModelTests.createModel(
+ "id",
+ "http://testopenai.local",
+ AzureAiStudioProvider.OPENAI,
+ AzureAiStudioEndpointType.TOKEN,
+ "apikey"
+ );
+ var request = new AzureAiStudioChatCompletionRequest(model, List.of("test input"));
+ var result = (ChatCompletionResults) entity.apply(
+ request,
+ new HttpResult(mock(HttpResponse.class), testTokenResponseJson.getBytes(StandardCharsets.UTF_8))
+ );
+
+ assertThat(result.getResults().size(), equalTo(1));
+ assertThat(result.getResults().get(0).content(), is("test input string"));
+ }
+
+ public void testCompletionResponse_FromRealtimeEndpoint() throws IOException {
+ var entity = new AzureAiStudioChatCompletionResponseEntity();
+ var model = AzureAiStudioChatCompletionModelTests.createModel(
+ "id",
+ "http://testmistral.local",
+ AzureAiStudioProvider.MISTRAL,
+ AzureAiStudioEndpointType.REALTIME,
+ "apikey"
+ );
+ var request = new AzureAiStudioChatCompletionRequest(model, List.of("test input"));
+ var result = (ChatCompletionResults) entity.apply(
+ request,
+ new HttpResult(mock(HttpResponse.class), testRealtimeResponseJson.getBytes(StandardCharsets.UTF_8))
+ );
+
+ assertThat(result.getResults().size(), equalTo(1));
+ assertThat(result.getResults().get(0).content(), is("test realtime response"));
+ }
+
+ private static String testRealtimeResponseJson = """
+ {
+ "output": "test realtime response"
+ }
+ """;
+
+ private static String testTokenResponseJson = """
+ {
+ "choices": [
+ {
+ "finish_reason": "stop",
+ "index": 0,
+ "message": {
+ "content": "test input string",
+ "role": "assistant",
+ "tool_calls": null
+ }
+ }
+ ],
+ "created": 1714006424,
+ "id": "f92b5b4d-0de3-4152-a3c6-5aae8a74555c",
+ "model": "",
+ "object": "chat.completion",
+ "usage": {
+ "completion_tokens": 35,
+ "prompt_tokens": 8,
+ "total_tokens": 43
+ }
+ }""";
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioEmbeddingsResponseEntityTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioEmbeddingsResponseEntityTests.java
new file mode 100644
index 0000000000000..fd31743616e6e
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/azureaistudio/AzureAiStudioEmbeddingsResponseEntityTests.java
@@ -0,0 +1,60 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response.azureaistudio;
+
+import org.apache.http.HttpResponse;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xpack.core.inference.results.TextEmbeddingResults;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.request.Request;
+
+import java.io.IOException;
+import java.nio.charset.StandardCharsets;
+import java.util.List;
+
+import static org.hamcrest.Matchers.is;
+import static org.mockito.Mockito.mock;
+
+/**
+ * Note - the underlying AzureAiStudioEmbeddingsResponseEntity uses the same
+ * response entity parser as OpenAI. This test just performs a smoke
+ * test of the wrapper
+ */
+public class AzureAiStudioEmbeddingsResponseEntityTests extends ESTestCase {
+ public void testFromResponse_CreatesResultsForASingleItem() throws IOException {
+ String responseJson = """
+ {
+ "object": "list",
+ "data": [
+ {
+ "object": "embedding",
+ "index": 0,
+ "embedding": [
+ 0.014539449,
+ -0.015288644
+ ]
+ }
+ ],
+ "model": "text-embedding-ada-002-v2",
+ "usage": {
+ "prompt_tokens": 8,
+ "total_tokens": 8
+ }
+ }
+ """;
+
+ var entity = new AzureAiStudioEmbeddingsResponseEntity();
+
+ var parsedResults = (TextEmbeddingResults) entity.apply(
+ mock(Request.class),
+ new HttpResult(mock(HttpResponse.class), responseJson.getBytes(StandardCharsets.UTF_8))
+ );
+
+ assertThat(parsedResults.embeddings(), is(List.of(new TextEmbeddingResults.Embedding(List.of(0.014539449F, -0.015288644F)))));
+ }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/cohere/CohereCompletionResponseEntityTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/cohere/CohereCompletionResponseEntityTests.java
new file mode 100644
index 0000000000000..70e1656195c3c
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/external/response/cohere/CohereCompletionResponseEntityTests.java
@@ -0,0 +1,159 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.external.response.cohere;
+
+import org.apache.http.HttpResponse;
+import org.elasticsearch.common.ParsingException;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.xpack.core.inference.results.ChatCompletionResults;
+import org.elasticsearch.xpack.inference.external.http.HttpResult;
+import org.elasticsearch.xpack.inference.external.request.Request;
+
+import java.io.IOException;
+import java.nio.charset.StandardCharsets;
+
+import static org.hamcrest.Matchers.is;
+import static org.mockito.Mockito.mock;
+
+public class CohereCompletionResponseEntityTests extends ESTestCase {
+
+ public void testFromResponse_CreatesResponseEntityForText() throws IOException {
+ String responseJson = """
+ {
+ "response_id": "some id",
+ "text": "result",
+ "generation_id": "some id",
+ "chat_history": [
+ {
+ "role": "USER",
+ "message": "some input"
+ },
+ {
+ "role": "CHATBOT",
+ "message": "result"
+ }
+ ],
+ "finish_reason": "COMPLETE",
+ "meta": {
+ "api_version": {
+ "version": "1"
+ },
+ "billed_units": {
+ "input_tokens": 4,
+ "output_tokens": 191
+ },
+ "tokens": {
+ "input_tokens": 70,
+ "output_tokens": 191
+ }
+ }
+ }
+ """;
+
+ ChatCompletionResults chatCompletionResults = CohereCompletionResponseEntity.fromResponse(
+ mock(Request.class),
+ new HttpResult(mock(HttpResponse.class), responseJson.getBytes(StandardCharsets.UTF_8))
+ );
+
+ assertThat(chatCompletionResults.getResults().size(), is(1));
+ assertThat(chatCompletionResults.getResults().get(0).content(), is("result"));
+ }
+
+ public void testFromResponse_FailsWhenTextIsNotPresent() {
+ String responseJson = """
+ {
+ "response_id": "some id",
+ "not_text": "result",
+ "generation_id": "some id",
+ "chat_history": [
+ {
+ "role": "USER",
+ "message": "some input"
+ },
+ {
+ "role": "CHATBOT",
+ "message": "result"
+ }
+ ],
+ "finish_reason": "COMPLETE",
+ "meta": {
+ "api_version": {
+ "version": "1"
+ },
+ "billed_units": {
+ "input_tokens": 4,
+ "output_tokens": 191
+ },
+ "tokens": {
+ "input_tokens": 70,
+ "output_tokens": 191
+ }
+ }
+ }
+ """;
+
+ var thrownException = expectThrows(
+ IllegalStateException.class,
+ () -> CohereCompletionResponseEntity.fromResponse(
+ mock(Request.class),
+ new HttpResult(mock(HttpResponse.class), responseJson.getBytes(StandardCharsets.UTF_8))
+ )
+ );
+
+ assertThat(thrownException.getMessage(), is("Failed to find required field [text] in Cohere chat response"));
+ }
+
+ public void testFromResponse_FailsWhenTextIsNotAString() {
+ String responseJson = """
+ {
+ "response_id": "some id",
+ "text": {
+ "text": "result"
+ },
+ "generation_id": "some id",
+ "chat_history": [
+ {
+ "role": "USER",
+ "message": "some input"
+ },
+ {
+ "role": "CHATBOT",
+ "message": "result"
+ }
+ ],
+ "finish_reason": "COMPLETE",
+ "meta": {
+ "api_version": {
+ "version": "1"
+ },
+ "billed_units": {
+ "input_tokens": 4,
+ "output_tokens": 191
+ },
+ "tokens": {
+ "input_tokens": 70,
+ "output_tokens": 191
+ }
+ }
+ }
+ """;
+
+ var thrownException = expectThrows(
+ ParsingException.class,
+ () -> CohereCompletionResponseEntity.fromResponse(
+ mock(Request.class),
+ new HttpResult(mock(HttpResponse.class), responseJson.getBytes(StandardCharsets.UTF_8))
+ )
+ );
+
+ assertThat(
+ thrownException.getMessage(),
+ is("Failed to parse object: expecting token of type [VALUE_STRING] but found [START_OBJECT]")
+ );
+ }
+}
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/ServiceUtilsTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/ServiceUtilsTests.java
index bf9fdbe7235b6..6f05ab79629e6 100644
--- a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/ServiceUtilsTests.java
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/ServiceUtilsTests.java
@@ -11,6 +11,7 @@
import org.elasticsearch.action.ActionListener;
import org.elasticsearch.action.support.PlainActionFuture;
import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.core.Booleans;
import org.elasticsearch.core.TimeValue;
import org.elasticsearch.inference.InferenceService;
import org.elasticsearch.inference.InferenceServiceResults;
@@ -32,6 +33,7 @@
import static org.elasticsearch.xpack.inference.services.ServiceUtils.createUri;
import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalEnum;
import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalPositiveInteger;
+import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalPositiveLong;
import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalString;
import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractOptionalTimeValue;
import static org.elasticsearch.xpack.inference.services.ServiceUtils.extractRequiredSecureString;
@@ -193,6 +195,95 @@ public void testRemoveAsTypeMissingReturnsNull() {
assertThat(map.entrySet(), hasSize(3));
}
+ public void testRemoveAsOneOfTypes_Validation_WithCorrectTypes() {
+ Map map = new HashMap<>(Map.of("a", 5, "b", "a string", "c", Boolean.TRUE, "d", 1.0));
+ ValidationException validationException = new ValidationException();
+
+ Integer i = (Integer) ServiceUtils.removeAsOneOfTypes(map, "a", List.of(String.class, Integer.class), validationException);
+ assertEquals(Integer.valueOf(5), i);
+ assertNull(map.get("a")); // field has been removed
+
+ String str = (String) ServiceUtils.removeAsOneOfTypes(map, "b", List.of(Integer.class, String.class), validationException);
+ assertEquals("a string", str);
+ assertNull(map.get("b"));
+
+ Boolean b = (Boolean) ServiceUtils.removeAsOneOfTypes(map, "c", List.of(String.class, Boolean.class), validationException);
+ assertEquals(Boolean.TRUE, b);
+ assertNull(map.get("c"));
+
+ Double d = (Double) ServiceUtils.removeAsOneOfTypes(map, "d", List.of(Booleans.class, Double.class), validationException);
+ assertEquals(Double.valueOf(1.0), d);
+ assertNull(map.get("d"));
+
+ assertThat(map.entrySet(), empty());
+ }
+
+ public void testRemoveAsOneOfTypes_Validation_WithIncorrectType() {
+ Map map = new HashMap<>(Map.of("a", 5, "b", "a string", "c", Boolean.TRUE, "d", 5.0, "e", 5));
+
+ var validationException = new ValidationException();
+ Object result = ServiceUtils.removeAsOneOfTypes(map, "a", List.of(String.class, Boolean.class), validationException);
+ assertNull(result);
+ assertThat(validationException.validationErrors(), hasSize(1));
+ assertThat(
+ validationException.validationErrors().get(0),
+ containsString("field [a] is not of one of the expected types. The value [5] cannot be converted to one of [String, Boolean]")
+ );
+ assertNull(map.get("a"));
+
+ validationException = new ValidationException();
+ result = ServiceUtils.removeAsOneOfTypes(map, "b", List.of(Boolean.class, Integer.class), validationException);
+ assertNull(result);
+ assertThat(validationException.validationErrors(), hasSize(1));
+ assertThat(
+ validationException.validationErrors().get(0),
+ containsString(
+ "field [b] is not of one of the expected types. The value [a string] cannot be converted to one of [Boolean, Integer]"
+ )
+ );
+ assertNull(map.get("b"));
+
+ validationException = new ValidationException();
+ result = ServiceUtils.removeAsOneOfTypes(map, "c", List.of(String.class, Integer.class), validationException);
+ assertNull(result);
+ assertThat(validationException.validationErrors(), hasSize(1));
+ assertThat(
+ validationException.validationErrors().get(0),
+ containsString(
+ "field [c] is not of one of the expected types. The value [true] cannot be converted to one of [String, Integer]"
+ )
+ );
+ assertNull(map.get("c"));
+
+ validationException = new ValidationException();
+ result = ServiceUtils.removeAsOneOfTypes(map, "d", List.of(String.class, Boolean.class), validationException);
+ assertNull(result);
+ assertThat(validationException.validationErrors(), hasSize(1));
+ assertThat(
+ validationException.validationErrors().get(0),
+ containsString("field [d] is not of one of the expected types. The value [5.0] cannot be converted to one of [String, Boolean]")
+ );
+ assertNull(map.get("d"));
+
+ validationException = new ValidationException();
+ result = ServiceUtils.removeAsOneOfTypes(map, "e", List.of(String.class, Boolean.class), validationException);
+ assertNull(result);
+ assertThat(validationException.validationErrors(), hasSize(1));
+ assertThat(
+ validationException.validationErrors().get(0),
+ containsString("field [e] is not of one of the expected types. The value [5] cannot be converted to one of [String, Boolean]")
+ );
+ assertNull(map.get("e"));
+
+ assertThat(map.entrySet(), empty());
+ }
+
+ public void testRemoveAsOneOfTypesMissingReturnsNull() {
+ Map map = new HashMap<>(Map.of("a", 5, "b", "a string", "c", Boolean.TRUE));
+ assertNull(ServiceUtils.removeAsOneOfTypes(map, "missing", List.of(Integer.class), new ValidationException()));
+ assertThat(map.entrySet(), hasSize(3));
+ }
+
public void testConvertToUri_CreatesUri() {
var validation = new ValidationException();
var uri = convertToUri("www.elastic.co", "name", "scope", validation);
@@ -347,6 +438,22 @@ public void testExtractOptionalPositiveInt() {
assertThat(validation.validationErrors(), hasSize(1));
}
+ public void testExtractOptionalPositiveLong_IntegerValue() {
+ var validation = new ValidationException();
+ validation.addValidationError("previous error");
+ Map map = modifiableMap(Map.of("abc", 3));
+ assertEquals(Long.valueOf(3), extractOptionalPositiveLong(map, "abc", "scope", validation));
+ assertThat(validation.validationErrors(), hasSize(1));
+ }
+
+ public void testExtractOptionalPositiveLong() {
+ var validation = new ValidationException();
+ validation.addValidationError("previous error");
+ Map map = modifiableMap(Map.of("abc", 4_000_000_000L));
+ assertEquals(Long.valueOf(4_000_000_000L), extractOptionalPositiveLong(map, "abc", "scope", validation));
+ assertThat(validation.validationErrors(), hasSize(1));
+ }
+
public void testExtractOptionalEnum_ReturnsNull_WhenFieldDoesNotExist() {
var validation = new ValidationException();
Map map = modifiableMap(Map.of("key", "value"));
@@ -470,6 +577,127 @@ public void testExtractOptionalTimeValue_ReturnsNullAndAddsException_WhenTimeVal
);
}
+ public void testExtractOptionalDouble_ExtractsAsDoubleInRange() {
+ var validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", 1.01));
+ var result = ServiceUtils.extractOptionalDoubleInRange(map, "key", 0.0, 2.0, "test_scope", validationException);
+ assertEquals(Double.valueOf(1.01), result);
+ assertTrue(map.isEmpty());
+ assertThat(validationException.validationErrors().size(), is(0));
+ }
+
+ public void testExtractOptionalDouble_InRange_ReturnsNullWhenKeyNotPresent() {
+ var validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", 1.01));
+ var result = ServiceUtils.extractOptionalDoubleInRange(map, "other_key", 0.0, 2.0, "test_scope", validationException);
+ assertNull(result);
+ assertThat(map.size(), is(1));
+ assertThat(map.get("key"), is(1.01));
+ }
+
+ public void testExtractOptionalDouble_InRange_HasErrorWhenBelowMinValue() {
+ var validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", -2.0));
+ var result = ServiceUtils.extractOptionalDoubleInRange(map, "key", 0.0, 2.0, "test_scope", validationException);
+ assertNull(result);
+ assertThat(validationException.validationErrors().size(), is(1));
+ assertThat(
+ validationException.validationErrors().get(0),
+ is("[test_scope] Invalid value [-2.0]. [key] must be a greater than or equal to [0.0]")
+ );
+ }
+
+ public void testExtractOptionalDouble_InRange_HasErrorWhenAboveMaxValue() {
+ var validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", 12.0));
+ var result = ServiceUtils.extractOptionalDoubleInRange(map, "key", 0.0, 2.0, "test_scope", validationException);
+ assertNull(result);
+ assertThat(validationException.validationErrors().size(), is(1));
+ assertThat(
+ validationException.validationErrors().get(0),
+ is("[test_scope] Invalid value [12.0]. [key] must be a less than or equal to [2.0]")
+ );
+ }
+
+ public void testExtractOptionalDouble_InRange_DoesNotCheckMinWhenNull() {
+ var validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", -2.0));
+ var result = ServiceUtils.extractOptionalDoubleInRange(map, "key", null, 2.0, "test_scope", validationException);
+ assertEquals(Double.valueOf(-2.0), result);
+ assertTrue(map.isEmpty());
+ assertThat(validationException.validationErrors().size(), is(0));
+ }
+
+ public void testExtractOptionalDouble_InRange_DoesNotCheckMaxWhenNull() {
+ var validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", 12.0));
+ var result = ServiceUtils.extractOptionalDoubleInRange(map, "key", 0.0, null, "test_scope", validationException);
+ assertEquals(Double.valueOf(12.0), result);
+ assertTrue(map.isEmpty());
+ assertThat(validationException.validationErrors().size(), is(0));
+ }
+
+ public void testExtractOptionalFloat_ExtractsAFloat() {
+ Map map = modifiableMap(Map.of("key", 1.0f));
+ var result = ServiceUtils.extractOptionalFloat(map, "key");
+ assertThat(result, is(1.0f));
+ assertTrue(map.isEmpty());
+ }
+
+ public void testExtractOptionalFloat_ReturnsNullWhenKeyNotPresent() {
+ Map map = modifiableMap(Map.of("key", 1.0f));
+ var result = ServiceUtils.extractOptionalFloat(map, "other_key");
+ assertNull(result);
+ assertThat(map.size(), is(1));
+ assertThat(map.get("key"), is(1.0f));
+ }
+
+ public void testExtractRequiredEnum_ExtractsAEnum() {
+ ValidationException validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", "ingest"));
+ var result = ServiceUtils.extractRequiredEnum(
+ map,
+ "key",
+ "testscope",
+ InputType::fromString,
+ EnumSet.allOf(InputType.class),
+ validationException
+ );
+ assertThat(result, is(InputType.INGEST));
+ }
+
+ public void testExtractRequiredEnum_ReturnsNullWhenEnumValueIsNotPresent() {
+ ValidationException validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", "invalid"));
+ var result = ServiceUtils.extractRequiredEnum(
+ map,
+ "key",
+ "testscope",
+ InputType::fromString,
+ EnumSet.allOf(InputType.class),
+ validationException
+ );
+ assertNull(result);
+ assertThat(validationException.validationErrors().size(), is(1));
+ assertThat(validationException.validationErrors().get(0), containsString("Invalid value [invalid] received. [key] must be one of"));
+ }
+
+ public void testExtractRequiredEnum_HasValidationErrorOnMissingSetting() {
+ ValidationException validationException = new ValidationException();
+ Map map = modifiableMap(Map.of("key", "ingest"));
+ var result = ServiceUtils.extractRequiredEnum(
+ map,
+ "missing_key",
+ "testscope",
+ InputType::fromString,
+ EnumSet.allOf(InputType.class),
+ validationException
+ );
+ assertNull(result);
+ assertThat(validationException.validationErrors().size(), is(1));
+ assertThat(validationException.validationErrors().get(0), is("[testscope] does not contain the required setting [missing_key]"));
+ }
+
public void testGetEmbeddingSize_ReturnsError_WhenTextEmbeddingResults_IsEmpty() {
var service = mock(InferenceService.class);
diff --git a/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioServiceTests.java b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioServiceTests.java
new file mode 100644
index 0000000000000..51593c8d052d9
--- /dev/null
+++ b/x-pack/plugin/inference/src/test/java/org/elasticsearch/xpack/inference/services/azureaistudio/AzureAiStudioServiceTests.java
@@ -0,0 +1,1177 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.inference.services.azureaistudio;
+
+import org.apache.http.HttpHeaders;
+import org.elasticsearch.ElasticsearchException;
+import org.elasticsearch.ElasticsearchStatusException;
+import org.elasticsearch.action.ActionListener;
+import org.elasticsearch.action.support.PlainActionFuture;
+import org.elasticsearch.common.ValidationException;
+import org.elasticsearch.common.settings.Settings;
+import org.elasticsearch.core.Nullable;
+import org.elasticsearch.core.TimeValue;
+import org.elasticsearch.inference.ChunkedInferenceServiceResults;
+import org.elasticsearch.inference.ChunkingOptions;
+import org.elasticsearch.inference.InferenceServiceResults;
+import org.elasticsearch.inference.InputType;
+import org.elasticsearch.inference.Model;
+import org.elasticsearch.inference.ModelConfigurations;
+import org.elasticsearch.inference.ModelSecrets;
+import org.elasticsearch.inference.SimilarityMeasure;
+import org.elasticsearch.inference.TaskType;
+import org.elasticsearch.test.ESTestCase;
+import org.elasticsearch.test.http.MockResponse;
+import org.elasticsearch.test.http.MockWebServer;
+import org.elasticsearch.threadpool.ThreadPool;
+import org.elasticsearch.xcontent.XContentType;
+import org.elasticsearch.xpack.core.inference.action.InferenceAction;
+import org.elasticsearch.xpack.core.inference.results.ChatCompletionResults;
+import org.elasticsearch.xpack.core.inference.results.ChunkedTextEmbeddingResults;
+import org.elasticsearch.xpack.core.ml.inference.results.ChunkedNlpInferenceResults;
+import org.elasticsearch.xpack.inference.external.http.HttpClientManager;
+import org.elasticsearch.xpack.inference.external.http.sender.HttpRequestSender;
+import org.elasticsearch.xpack.inference.external.http.sender.HttpRequestSenderTests;
+import org.elasticsearch.xpack.inference.external.http.sender.Sender;
+import org.elasticsearch.xpack.inference.logging.ThrottlerManager;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionModel;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionModelTests;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionServiceSettingsTests;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionTaskSettings;
+import org.elasticsearch.xpack.inference.services.azureaistudio.completion.AzureAiStudioChatCompletionTaskSettingsTests;
+import org.elasticsearch.xpack.inference.services.azureaistudio.embeddings.AzureAiStudioEmbeddingsModel;
+import org.elasticsearch.xpack.inference.services.azureaistudio.embeddings.AzureAiStudioEmbeddingsModelTests;
+import org.elasticsearch.xpack.inference.services.azureaistudio.embeddings.AzureAiStudioEmbeddingsServiceSettingsTests;
+import org.elasticsearch.xpack.inference.services.azureaistudio.embeddings.AzureAiStudioEmbeddingsTaskSettingsTests;
+import org.hamcrest.CoreMatchers;
+import org.hamcrest.MatcherAssert;
+import org.hamcrest.Matchers;
+import org.junit.After;
+import org.junit.Before;
+
+import java.io.IOException;
+import java.net.URISyntaxException;
+import java.util.HashMap;
+import java.util.List;
+import java.util.Map;
+import java.util.Set;
+import java.util.concurrent.TimeUnit;
+
+import static org.elasticsearch.xpack.inference.Utils.inferenceUtilityPool;
+import static org.elasticsearch.xpack.inference.Utils.mockClusterServiceEmpty;
+import static org.elasticsearch.xpack.inference.external.http.Utils.entityAsMap;
+import static org.elasticsearch.xpack.inference.external.http.Utils.getUrl;
+import static org.elasticsearch.xpack.inference.external.request.azureopenai.AzureOpenAiUtils.API_KEY_HEADER;
+import static org.elasticsearch.xpack.inference.results.ChunkedTextEmbeddingResultsTests.asMapWithListsInsteadOfArrays;
+import static org.elasticsearch.xpack.inference.services.ServiceComponentsTests.createWithEmptySettings;
+import static org.elasticsearch.xpack.inference.services.Utils.getInvalidModel;
+import static org.elasticsearch.xpack.inference.services.azureaistudio.AzureAiStudioConstants.API_KEY_FIELD;
+import static org.hamcrest.CoreMatchers.is;
+import static org.hamcrest.Matchers.containsString;
+import static org.hamcrest.Matchers.equalTo;
+import static org.hamcrest.Matchers.hasSize;
+import static org.hamcrest.Matchers.instanceOf;
+import static org.mockito.ArgumentMatchers.anyString;
+import static org.mockito.Mockito.mock;
+import static org.mockito.Mockito.times;
+import static org.mockito.Mockito.verify;
+import static org.mockito.Mockito.verifyNoMoreInteractions;
+import static org.mockito.Mockito.when;
+
+public class AzureAiStudioServiceTests extends ESTestCase {
+ private static final TimeValue TIMEOUT = new TimeValue(30, TimeUnit.SECONDS);
+ private final MockWebServer webServer = new MockWebServer();
+ private ThreadPool threadPool;
+ private HttpClientManager clientManager;
+
+ @Before
+ public void init() throws Exception {
+ webServer.start();
+ threadPool = createThreadPool(inferenceUtilityPool());
+ clientManager = HttpClientManager.create(Settings.EMPTY, threadPool, mockClusterServiceEmpty(), mock(ThrottlerManager.class));
+ }
+
+ @After
+ public void shutdown() throws IOException {
+ clientManager.close();
+ terminate(threadPool);
+ webServer.close();
+ }
+
+ public void testParseRequestConfig_CreatesAnAzureAiStudioEmbeddingsModel() throws IOException {
+ try (var service = createService()) {
+ ActionListener modelVerificationListener = ActionListener.wrap(model -> {
+ assertThat(model, instanceOf(AzureAiStudioEmbeddingsModel.class));
+
+ var embeddingsModel = (AzureAiStudioEmbeddingsModel) model;
+ assertThat(embeddingsModel.getServiceSettings().target(), is("http://target.local"));
+ assertThat(embeddingsModel.getServiceSettings().provider(), is(AzureAiStudioProvider.OPENAI));
+ assertThat(embeddingsModel.getServiceSettings().endpointType(), is(AzureAiStudioEndpointType.TOKEN));
+ assertThat(embeddingsModel.getSecretSettings().apiKey().toString(), is("secret"));
+ assertThat(embeddingsModel.getTaskSettings().user(), is("user"));
+ }, exception -> fail("Unexpected exception: " + exception));
+
+ service.parseRequestConfig(
+ "id",
+ TaskType.TEXT_EMBEDDING,
+ getRequestConfigMap(
+ getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", null, null, null, null),
+ getEmbeddingsTaskSettingsMap("user"),
+ getSecretSettingsMap("secret")
+ ),
+ Set.of(),
+ modelVerificationListener
+ );
+ }
+ }
+
+ public void testParseRequestConfig_CreatesAnAzureAiStudioChatCompletionModel() throws IOException {
+ try (var service = createService()) {
+ ActionListener modelVerificationListener = ActionListener.wrap(model -> {
+ assertThat(model, instanceOf(AzureAiStudioChatCompletionModel.class));
+
+ var completionModel = (AzureAiStudioChatCompletionModel) model;
+ assertThat(completionModel.getServiceSettings().target(), is("http://target.local"));
+ assertThat(completionModel.getServiceSettings().provider(), is(AzureAiStudioProvider.OPENAI));
+ assertThat(completionModel.getServiceSettings().endpointType(), is(AzureAiStudioEndpointType.TOKEN));
+ assertThat(completionModel.getSecretSettings().apiKey().toString(), is("secret"));
+ assertNull(completionModel.getTaskSettings().temperature());
+ assertTrue(completionModel.getTaskSettings().doSample());
+ }, exception -> fail("Unexpected exception: " + exception));
+
+ service.parseRequestConfig(
+ "id",
+ TaskType.COMPLETION,
+ getRequestConfigMap(
+ getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+ getChatCompletionTaskSettingsMap(null, null, true, null),
+ getSecretSettingsMap("secret")
+ ),
+ Set.of(),
+ modelVerificationListener
+ );
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsUnsupportedModelType() throws IOException {
+ try (var service = createService()) {
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(exception.getMessage(), is("The [azureaistudio] service does not support task type [sparse_embedding]"));
+ }
+ );
+
+ service.parseRequestConfig(
+ "id",
+ TaskType.SPARSE_EMBEDDING,
+ getRequestConfigMap(
+ getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+ getChatCompletionTaskSettingsMap(null, null, true, null),
+ getSecretSettingsMap("secret")
+ ),
+ Set.of(),
+ modelVerificationListener
+ );
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenAnExtraKeyExistsInConfig() throws IOException {
+ try (var service = createService()) {
+ var config = getRequestConfigMap(
+ getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+ getChatCompletionTaskSettingsMap(null, null, true, null),
+ getSecretSettingsMap("secret")
+ );
+ config.put("extra_key", "value");
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("Model configuration contains settings [{extra_key=value}] unknown to the [azureaistudio] service")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.COMPLETION, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenAnExtraKeyExistsInEmbeddingServiceSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", null, null, null, null);
+ serviceSettings.put("extra_key", "value");
+
+ var config = getRequestConfigMap(serviceSettings, getEmbeddingsTaskSettingsMap("user"), getSecretSettingsMap("secret"));
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("Model configuration contains settings [{extra_key=value}] unknown to the [azureaistudio] service")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.TEXT_EMBEDDING, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenDimsSetByUserExistsInEmbeddingServiceSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var config = getRequestConfigMap(
+ getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", 1024, true, null, null),
+ getEmbeddingsTaskSettingsMap("user"),
+ getSecretSettingsMap("secret")
+ );
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ValidationException.class));
+ assertThat(
+ exception.getMessage(),
+ containsString("[service_settings] does not allow the setting [dimensions_set_by_user]")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.TEXT_EMBEDDING, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenAnExtraKeyExistsInEmbeddingTaskSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var taskSettings = getEmbeddingsTaskSettingsMap("user");
+ taskSettings.put("extra_key", "value");
+
+ var config = getRequestConfigMap(
+ getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", null, null, null, null),
+ taskSettings,
+ getSecretSettingsMap("secret")
+ );
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("Model configuration contains settings [{extra_key=value}] unknown to the [azureaistudio] service")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.TEXT_EMBEDDING, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenAnExtraKeyExistsInEmbeddingSecretSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var secretSettings = getSecretSettingsMap("secret");
+ secretSettings.put("extra_key", "value");
+
+ var config = getRequestConfigMap(
+ getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", null, null, null, null),
+ getEmbeddingsTaskSettingsMap("user"),
+ secretSettings
+ );
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("Model configuration contains settings [{extra_key=value}] unknown to the [azureaistudio] service")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.TEXT_EMBEDDING, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenAnExtraKeyExistsInChatCompletionServiceSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getChatCompletionServiceSettingsMap("http://target.local", "openai", "token");
+ serviceSettings.put("extra_key", "value");
+
+ var config = getRequestConfigMap(
+ serviceSettings,
+ getChatCompletionTaskSettingsMap(null, 2.0, null, null),
+ getSecretSettingsMap("secret")
+ );
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("Model configuration contains settings [{extra_key=value}] unknown to the [azureaistudio] service")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.COMPLETION, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenAnExtraKeyExistsInChatCompletionTaskSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var taskSettings = getChatCompletionTaskSettingsMap(null, 2.0, null, null);
+ taskSettings.put("extra_key", "value");
+
+ var config = getRequestConfigMap(
+ getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+ taskSettings,
+ getSecretSettingsMap("secret")
+ );
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("Model configuration contains settings [{extra_key=value}] unknown to the [azureaistudio] service")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.COMPLETION, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenAnExtraKeyExistsInChatCompletionSecretSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var secretSettings = getSecretSettingsMap("secret");
+ secretSettings.put("extra_key", "value");
+
+ var config = getRequestConfigMap(
+ getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+ getChatCompletionTaskSettingsMap(null, 2.0, null, null),
+ secretSettings
+ );
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("Model configuration contains settings [{extra_key=value}] unknown to the [azureaistudio] service")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.COMPLETION, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenProviderIsNotValidForEmbeddings() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getEmbeddingsServiceSettingsMap("http://target.local", "databricks", "token", null, null, null, null);
+
+ var config = getRequestConfigMap(serviceSettings, getEmbeddingsTaskSettingsMap("user"), getSecretSettingsMap("secret"));
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(exception.getMessage(), is("The [text_embedding] task type for provider [databricks] is not available"));
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.TEXT_EMBEDDING, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenEndpointTypeIsNotValidForEmbeddingsProvider() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getEmbeddingsServiceSettingsMap("http://target.local", "openai", "realtime", null, null, null, null);
+
+ var config = getRequestConfigMap(serviceSettings, getEmbeddingsTaskSettingsMap("user"), getSecretSettingsMap("secret"));
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("The [realtime] endpoint type with [text_embedding] task type for provider [openai] is not available")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.TEXT_EMBEDDING, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParseRequestConfig_ThrowsWhenEndpointTypeIsNotValidForChatCompletionProvider() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getChatCompletionServiceSettingsMap("http://target.local", "openai", "realtime");
+
+ var config = getRequestConfigMap(
+ serviceSettings,
+ getChatCompletionTaskSettingsMap(null, null, null, null),
+ getSecretSettingsMap("secret")
+ );
+
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(
+ exception.getMessage(),
+ is("The [realtime] endpoint type with [completion] task type for provider [openai] is not available")
+ );
+ }
+ );
+
+ service.parseRequestConfig("id", TaskType.COMPLETION, config, Set.of(), modelVerificationListener);
+ }
+ }
+
+ public void testParsePersistedConfig_CreatesAnAzureAiStudioEmbeddingsModel() throws IOException {
+ try (var service = createService()) {
+ var config = getPersistedConfigMap(
+ getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", 1024, true, 512, null),
+ getEmbeddingsTaskSettingsMap("user"),
+ getSecretSettingsMap("secret")
+ );
+
+ var model = service.parsePersistedConfigWithSecrets("id", TaskType.TEXT_EMBEDDING, config.config(), config.secrets());
+
+ assertThat(model, instanceOf(AzureAiStudioEmbeddingsModel.class));
+
+ var embeddingsModel = (AzureAiStudioEmbeddingsModel) model;
+ assertThat(embeddingsModel.getServiceSettings().target(), is("http://target.local"));
+ assertThat(embeddingsModel.getServiceSettings().provider(), is(AzureAiStudioProvider.OPENAI));
+ assertThat(embeddingsModel.getServiceSettings().endpointType(), is(AzureAiStudioEndpointType.TOKEN));
+ assertThat(embeddingsModel.getServiceSettings().dimensions(), is(1024));
+ assertThat(embeddingsModel.getServiceSettings().dimensionsSetByUser(), is(true));
+ assertThat(embeddingsModel.getServiceSettings().maxInputTokens(), is(512));
+ assertThat(embeddingsModel.getSecretSettings().apiKey().toString(), is("secret"));
+ assertThat(embeddingsModel.getTaskSettings().user(), is("user"));
+ }
+ }
+
+ public void testParsePersistedConfig_CreatesAnAzureAiStudioChatCompletionModel() throws IOException {
+ try (var service = createService()) {
+ var config = getPersistedConfigMap(
+ getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+ getChatCompletionTaskSettingsMap(1.0, 2.0, true, 512),
+ getSecretSettingsMap("secret")
+ );
+
+ var model = service.parsePersistedConfigWithSecrets("id", TaskType.COMPLETION, config.config(), config.secrets());
+
+ assertThat(model, instanceOf(AzureAiStudioChatCompletionModel.class));
+
+ var chatCompletionModel = (AzureAiStudioChatCompletionModel) model;
+ assertThat(chatCompletionModel.getServiceSettings().target(), is("http://target.local"));
+ assertThat(chatCompletionModel.getServiceSettings().provider(), is(AzureAiStudioProvider.OPENAI));
+ assertThat(chatCompletionModel.getServiceSettings().endpointType(), is(AzureAiStudioEndpointType.TOKEN));
+ assertThat(chatCompletionModel.getTaskSettings().temperature(), is(1.0));
+ assertThat(chatCompletionModel.getTaskSettings().topP(), is(2.0));
+ assertThat(chatCompletionModel.getTaskSettings().doSample(), is(true));
+ assertThat(chatCompletionModel.getTaskSettings().maxNewTokens(), is(512));
+ }
+ }
+
+ public void testParsePersistedConfig_ThrowsUnsupportedModelType() throws IOException {
+ try (var service = createService()) {
+ ActionListener modelVerificationListener = ActionListener.wrap(
+ model -> fail("Expected exception, but got model: " + model),
+ exception -> {
+ assertThat(exception, instanceOf(ElasticsearchStatusException.class));
+ assertThat(exception.getMessage(), is("The [azureaistudio] service does not support task type [sparse_embedding]"));
+ }
+ );
+
+ service.parseRequestConfig(
+ "id",
+ TaskType.SPARSE_EMBEDDING,
+ getRequestConfigMap(
+ getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+ getChatCompletionTaskSettingsMap(null, null, true, null),
+ getSecretSettingsMap("secret")
+ ),
+ Set.of(),
+ modelVerificationListener
+ );
+ }
+ }
+
+ public void testParsePersistedConfigWithSecrets_ThrowsErrorTryingToParseInvalidModel() throws IOException {
+ try (var service = createService()) {
+ var config = getPersistedConfigMap(
+ getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+ getChatCompletionTaskSettingsMap(1.0, 2.0, true, 512),
+ getSecretSettingsMap("secret")
+ );
+
+ var thrownException = expectThrows(
+ ElasticsearchStatusException.class,
+ () -> service.parsePersistedConfigWithSecrets("id", TaskType.SPARSE_EMBEDDING, config.config(), config.secrets())
+ );
+
+ assertThat(
+ thrownException.getMessage(),
+ is("Failed to parse stored model [id] for [azureaistudio] service, please delete and add the service again")
+ );
+ }
+ }
+
+ public void testParsePersistedConfig_DoesNotThrowWhenAnExtraKeyExistsInConfig() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", 1024, true, 512, null);
+ var taskSettings = getEmbeddingsTaskSettingsMap("user");
+ var secretSettings = getSecretSettingsMap("secret");
+ var config = getPersistedConfigMap(serviceSettings, taskSettings, secretSettings);
+ config.config().put("extra_key", "value");
+
+ var model = service.parsePersistedConfigWithSecrets("id", TaskType.TEXT_EMBEDDING, config.config(), config.secrets());
+
+ assertThat(model, instanceOf(AzureAiStudioEmbeddingsModel.class));
+ }
+ }
+
+ public void testParsePersistedConfig_DoesNotThrowWhenExtraKeyExistsInEmbeddingServiceSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", 1024, true, 512, null);
+ serviceSettings.put("extra_key", "value");
+
+ var taskSettings = getEmbeddingsTaskSettingsMap("user");
+ var secretSettings = getSecretSettingsMap("secret");
+ var config = getPersistedConfigMap(serviceSettings, taskSettings, secretSettings);
+
+ var model = service.parsePersistedConfigWithSecrets("id", TaskType.TEXT_EMBEDDING, config.config(), config.secrets());
+
+ assertThat(model, instanceOf(AzureAiStudioEmbeddingsModel.class));
+ }
+ }
+
+ public void testParsePersistedConfig_DoesNotThrowWhenAnExtraKeyExistsInEmbeddingTaskSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", 1024, true, 512, null);
+ var taskSettings = getEmbeddingsTaskSettingsMap("user");
+ taskSettings.put("extra_key", "value");
+
+ var secretSettings = getSecretSettingsMap("secret");
+ var config = getPersistedConfigMap(serviceSettings, taskSettings, secretSettings);
+
+ var model = service.parsePersistedConfigWithSecrets("id", TaskType.TEXT_EMBEDDING, config.config(), config.secrets());
+
+ assertThat(model, instanceOf(AzureAiStudioEmbeddingsModel.class));
+ }
+ }
+
+ public void testParsePersistedConfig_DoesNotThrowWhenAnExtraKeyExistsInEmbeddingSecretSettingsMap() throws IOException {
+ try (var service = createService()) {
+ var serviceSettings = getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", 1024, true, 512, null);
+ var taskSettings = getEmbeddingsTaskSettingsMap("user");
+ var secretSettings = getSecretSettingsMap("secret");
+ secretSettings.put("extra_key", "value");
+
+ var config = getPersistedConfigMap(serviceSettings, taskSettings, secretSettings);
+
+ var model = service.parsePersistedConfigWithSecrets("id", TaskType.TEXT_EMBEDDING, config.config(), config.secrets());
+
+ assertThat(model, instanceOf(AzureAiStudioEmbeddingsModel.class));
+ }
+ }
+
+    // Unknown keys in the persisted chat-completion service settings must be ignored, not rejected.
+    public void testParsePersistedConfig_DoesNotThrowWhenAnExtraKeyExistsInChatCompletionServiceSettingsMap() throws IOException {
+        try (var service = createService()) {
+            var taskSettings = getChatCompletionTaskSettingsMap(1.0, 2.0, true, 512);
+            var secretSettings = getSecretSettingsMap("secret");
+
+            var serviceSettings = getChatCompletionServiceSettingsMap("http://target.local", "openai", "token");
+            serviceSettings.put("extra_key", "value");
+
+            var persistedConfig = getPersistedConfigMap(serviceSettings, taskSettings, secretSettings);
+            var parsedModel = service.parsePersistedConfigWithSecrets(
+                "id",
+                TaskType.COMPLETION,
+                persistedConfig.config(),
+                persistedConfig.secrets()
+            );
+
+            assertThat(parsedModel, instanceOf(AzureAiStudioChatCompletionModel.class));
+        }
+    }
+
+    // Unknown keys in the persisted chat-completion task settings must be ignored, not rejected.
+    public void testParsePersistedConfig_DoesNotThrowWhenAnExtraKeyExistsInChatCompletionTaskSettingsMap() throws IOException {
+        try (var service = createService()) {
+            var serviceSettings = getChatCompletionServiceSettingsMap("http://target.local", "openai", "token");
+            var secretSettings = getSecretSettingsMap("secret");
+
+            var taskSettings = getChatCompletionTaskSettingsMap(1.0, 2.0, true, 512);
+            taskSettings.put("extra_key", "value");
+
+            var persistedConfig = getPersistedConfigMap(serviceSettings, taskSettings, secretSettings);
+            var parsedModel = service.parsePersistedConfigWithSecrets(
+                "id",
+                TaskType.COMPLETION,
+                persistedConfig.config(),
+                persistedConfig.secrets()
+            );
+
+            assertThat(parsedModel, instanceOf(AzureAiStudioChatCompletionModel.class));
+        }
+    }
+
+    // Unknown keys in the persisted chat-completion secret settings must be ignored, not rejected.
+    public void testParsePersistedConfig_DoesNotThrowWhenAnExtraKeyExistsInChatCompletionSecretSettingsMap() throws IOException {
+        try (var service = createService()) {
+            var serviceSettings = getChatCompletionServiceSettingsMap("http://target.local", "openai", "token");
+            var taskSettings = getChatCompletionTaskSettingsMap(1.0, 2.0, true, 512);
+
+            var secretSettings = getSecretSettingsMap("secret");
+            secretSettings.put("extra_key", "value");
+
+            var persistedConfig = getPersistedConfigMap(serviceSettings, taskSettings, secretSettings);
+            var parsedModel = service.parsePersistedConfigWithSecrets(
+                "id",
+                TaskType.COMPLETION,
+                persistedConfig.config(),
+                persistedConfig.secrets()
+            );
+
+            assertThat(parsedModel, instanceOf(AzureAiStudioChatCompletionModel.class));
+        }
+    }
+
+    // parsePersistedConfig (no secrets variant) should still yield a fully populated embeddings model.
+    public void testParsePersistedConfig_WithoutSecretsCreatesEmbeddingsModel() throws IOException {
+        try (var service = createService()) {
+            var persistedConfig = getPersistedConfigMap(
+                getEmbeddingsServiceSettingsMap("http://target.local", "openai", "token", 1024, true, 512, null),
+                getEmbeddingsTaskSettingsMap("user"),
+                Map.of()
+            );
+
+            var parsedModel = service.parsePersistedConfig("id", TaskType.TEXT_EMBEDDING, persistedConfig.config());
+
+            assertThat(parsedModel, instanceOf(AzureAiStudioEmbeddingsModel.class));
+
+            var embeddingsModel = (AzureAiStudioEmbeddingsModel) parsedModel;
+            var settings = embeddingsModel.getServiceSettings();
+            assertThat(settings.target(), is("http://target.local"));
+            assertThat(settings.provider(), is(AzureAiStudioProvider.OPENAI));
+            assertThat(settings.endpointType(), is(AzureAiStudioEndpointType.TOKEN));
+            assertThat(settings.dimensions(), is(1024));
+            assertThat(settings.dimensionsSetByUser(), is(true));
+            assertThat(settings.maxInputTokens(), is(512));
+            assertThat(embeddingsModel.getTaskSettings().user(), is("user"));
+        }
+    }
+
+    // parsePersistedConfig (no secrets variant) should still yield a fully populated chat-completion model.
+    public void testParsePersistedConfig_WithoutSecretsCreatesChatCompletionModel() throws IOException {
+        try (var service = createService()) {
+            var persistedConfig = getPersistedConfigMap(
+                getChatCompletionServiceSettingsMap("http://target.local", "openai", "token"),
+                getChatCompletionTaskSettingsMap(1.0, 2.0, true, 512),
+                Map.of()
+            );
+
+            var parsedModel = service.parsePersistedConfig("id", TaskType.COMPLETION, persistedConfig.config());
+
+            assertThat(parsedModel, instanceOf(AzureAiStudioChatCompletionModel.class));
+
+            var completionModel = (AzureAiStudioChatCompletionModel) parsedModel;
+            var settings = completionModel.getServiceSettings();
+            assertThat(settings.target(), is("http://target.local"));
+            assertThat(settings.provider(), is(AzureAiStudioProvider.OPENAI));
+            assertThat(settings.endpointType(), is(AzureAiStudioEndpointType.TOKEN));
+
+            var taskSettings = completionModel.getTaskSettings();
+            assertThat(taskSettings.temperature(), is(1.0));
+            assertThat(taskSettings.topP(), is(2.0));
+            assertThat(taskSettings.doSample(), is(true));
+            assertThat(taskSettings.maxNewTokens(), is(512));
+        }
+    }
+
+    // checkModelConfig for an embeddings model probes the service with a test input and
+    // returns an updated model carrying the discovered embedding size (2 here, from
+    // testEmbeddingResultJson) and DOT_PRODUCT similarity.
+    public void testCheckModelConfig_ForEmbeddingsModel_Works() throws IOException {
+        var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+        try (var service = new AzureAiStudioService(senderFactory, createWithEmptySettings(threadPool))) {
+            webServer.enqueue(new MockResponse().setResponseCode(200).setBody(testEmbeddingResultJson));
+
+            var model = AzureAiStudioEmbeddingsModelTests.createModel(
+                "id",
+                getUrl(webServer),
+                AzureAiStudioProvider.OPENAI,
+                AzureAiStudioEndpointType.TOKEN,
+                "apikey",
+                null,
+                false,
+                null,
+                null,
+                null,
+                null
+            );
+
+            // fixed: raw PlainActionFuture — restore the type parameter; checkModelConfig reports a Model
+            PlainActionFuture<Model> listener = new PlainActionFuture<>();
+            service.checkModelConfig(model, listener);
+
+            var result = listener.actionGet(TIMEOUT);
+            assertThat(
+                result,
+                is(
+                    AzureAiStudioEmbeddingsModelTests.createModel(
+                        "id",
+                        getUrl(webServer),
+                        AzureAiStudioProvider.OPENAI,
+                        AzureAiStudioEndpointType.TOKEN,
+                        "apikey",
+                        2,
+                        false,
+                        null,
+                        SimilarityMeasure.DOT_PRODUCT,
+                        null,
+                        null
+                    )
+                )
+            );
+
+            assertThat(webServer.requests(), hasSize(1));
+
+            // the probe request should contain only the canned test input
+            var requestMap = entityAsMap(webServer.requests().get(0).getBody());
+            MatcherAssert.assertThat(requestMap, Matchers.is(Map.of("input", List.of("how big"))));
+        }
+    }
+
+    // When the user fixed dimensions (3) but the service returns a different embedding
+    // size (2, from testEmbeddingResultJson), checkModelConfig must fail with a clear error.
+    public void testCheckModelConfig_ForEmbeddingsModel_ThrowsIfEmbeddingSizeDoesNotMatchValueSetByUser() throws IOException {
+        var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+        try (var service = new AzureAiStudioService(senderFactory, createWithEmptySettings(threadPool))) {
+            webServer.enqueue(new MockResponse().setResponseCode(200).setBody(testEmbeddingResultJson));
+
+            var model = AzureAiStudioEmbeddingsModelTests.createModel(
+                "id",
+                getUrl(webServer),
+                AzureAiStudioProvider.OPENAI,
+                AzureAiStudioEndpointType.TOKEN,
+                "apikey",
+                3,
+                true,
+                null,
+                null,
+                null,
+                null
+            );
+
+            // fixed: raw PlainActionFuture — restore the type parameter; checkModelConfig reports a Model
+            PlainActionFuture<Model> listener = new PlainActionFuture<>();
+            service.checkModelConfig(model, listener);
+
+            var exception = expectThrows(ElasticsearchStatusException.class, () -> listener.actionGet(TIMEOUT));
+            assertThat(
+                exception.getMessage(),
+                is(
+                    "The retrieved embeddings size [2] does not match the size specified in the settings [3]. "
+                        + "Please recreate the [id] configuration with the correct dimensions"
+                )
+            );
+
+            assertThat(webServer.requests(), hasSize(1));
+
+            // user-set dimensions are forwarded in the probe request
+            var requestMap = entityAsMap(webServer.requests().get(0).getBody());
+            MatcherAssert.assertThat(requestMap, Matchers.is(Map.of("input", List.of("how big"), "dimensions", 3)));
+        }
+    }
+
+    // checkModelConfig for a chat-completion model should succeed and fill in the
+    // default max-new-tokens value on the returned model.
+    public void testCheckModelConfig_WorksForChatCompletionsModel() throws IOException {
+        var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+        try (var service = new AzureAiStudioService(senderFactory, createWithEmptySettings(threadPool))) {
+            webServer.enqueue(new MockResponse().setResponseCode(200).setBody(testChatCompletionResultJson));
+
+            var model = AzureAiStudioChatCompletionModelTests.createModel(
+                "id",
+                getUrl(webServer),
+                AzureAiStudioProvider.OPENAI,
+                AzureAiStudioEndpointType.TOKEN,
+                "apikey",
+                null,
+                null,
+                null,
+                null,
+                null
+            );
+
+            // fixed: raw PlainActionFuture — restore the type parameter; checkModelConfig reports a Model
+            PlainActionFuture<Model> listener = new PlainActionFuture<>();
+            service.checkModelConfig(model, listener);
+
+            var result = listener.actionGet(TIMEOUT);
+            assertThat(
+                result,
+                is(
+                    AzureAiStudioChatCompletionModelTests.createModel(
+                        "id",
+                        getUrl(webServer),
+                        AzureAiStudioProvider.OPENAI,
+                        AzureAiStudioEndpointType.TOKEN,
+                        "apikey",
+                        null,
+                        null,
+                        null,
+                        AzureAiStudioChatCompletionTaskSettings.DEFAULT_MAX_NEW_TOKENS,
+                        null
+                    )
+                )
+            );
+        }
+    }
+
+ public void testInfer_ThrowsErrorWhenModelIsNotAzureAiStudioModel() throws IOException {
+ var sender = mock(Sender.class);
+
+ var factory = mock(HttpRequestSender.Factory.class);
+ when(factory.createSender(anyString())).thenReturn(sender);
+
+ var mockModel = getInvalidModel("model_id", "service_name");
+
+ try (var service = new AzureAiStudioService(factory, createWithEmptySettings(threadPool))) {
+ PlainActionFuture listener = new PlainActionFuture<>();
+ service.infer(
+ mockModel,
+ null,
+ List.of(""),
+ new HashMap<>(),
+ InputType.INGEST,
+ InferenceAction.Request.DEFAULT_TIMEOUT,
+ listener
+ );
+
+ var thrownException = expectThrows(ElasticsearchStatusException.class, () -> listener.actionGet(TIMEOUT));
+ assertThat(
+ thrownException.getMessage(),
+ is("The internal model was invalid, please delete the service [service_name] with id [model_id] and add it again.")
+ );
+
+ verify(factory, times(1)).createSender(anyString());
+ verify(sender, times(1)).start();
+ }
+
+ verify(sender, times(1)).close();
+ verifyNoMoreInteractions(factory);
+ verifyNoMoreInteractions(sender);
+ }
+
+    // chunkedInfer on an embeddings model should call through to infer and convert the
+    // float response into chunked text-embedding results, preserving the input text.
+    public void testChunkedInfer_Embeddings_CallsInfer_ConvertsFloatResponse() throws IOException, URISyntaxException {
+        var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+        try (var service = new AzureAiStudioService(senderFactory, createWithEmptySettings(threadPool))) {
+
+            String responseJson = """
+                {
+                    "object": "list",
+                    "data": [
+                        {
+                            "object": "embedding",
+                            "index": 0,
+                            "embedding": [
+                                0.0123,
+                                -0.0123
+                            ]
+                        }
+                    ],
+                    "model": "text-embedding-ada-002-v2",
+                    "usage": {
+                        "prompt_tokens": 8,
+                        "total_tokens": 8
+                    }
+                }
+                """;
+            webServer.enqueue(new MockResponse().setResponseCode(200).setBody(responseJson));
+
+            var model = AzureAiStudioEmbeddingsModelTests.createModel(
+                "id",
+                getUrl(webServer),
+                AzureAiStudioProvider.OPENAI,
+                AzureAiStudioEndpointType.TOKEN,
+                "apikey",
+                null,
+                false,
+                null,
+                null,
+                "user",
+                null
+            );
+            // fixed: garbled generic "PlainActionFuture>" — chunkedInfer reports a list of chunked results
+            PlainActionFuture<List<ChunkedInferenceServiceResults>> listener = new PlainActionFuture<>();
+            service.chunkedInfer(
+                model,
+                List.of("abc"),
+                new HashMap<>(),
+                InputType.INGEST,
+                new ChunkingOptions(null, null),
+                InferenceAction.Request.DEFAULT_TIMEOUT,
+                listener
+            );
+
+            var result = listener.actionGet(TIMEOUT).get(0);
+            assertThat(result, CoreMatchers.instanceOf(ChunkedTextEmbeddingResults.class));
+
+            // the single chunk pairs the input text with the (widened-to-double) embedding values
+            assertThat(
+                asMapWithListsInsteadOfArrays((ChunkedTextEmbeddingResults) result),
+                Matchers.is(
+                    Map.of(
+                        ChunkedTextEmbeddingResults.FIELD_NAME,
+                        List.of(
+                            Map.of(
+                                ChunkedNlpInferenceResults.TEXT,
+                                "abc",
+                                ChunkedNlpInferenceResults.INFERENCE,
+                                List.of((double) 0.0123f, (double) -0.0123f)
+                            )
+                        )
+                    )
+                )
+            );
+            assertThat(webServer.requests(), hasSize(1));
+            assertNull(webServer.requests().get(0).getUri().getQuery());
+            assertThat(webServer.requests().get(0).getHeader(HttpHeaders.CONTENT_TYPE), equalTo(XContentType.JSON.mediaType()));
+            assertThat(webServer.requests().get(0).getHeader(API_KEY_HEADER), equalTo("apikey"));
+
+            var requestMap = entityAsMap(webServer.requests().get(0).getBody());
+            assertThat(requestMap.size(), Matchers.is(2));
+            assertThat(requestMap.get("input"), Matchers.is(List.of("abc")));
+            assertThat(requestMap.get("user"), Matchers.is("user"));
+        }
+    }
+
+    // Azure AI Studio does not support query-style inference; infer must reject a
+    // non-null query synchronously with UnsupportedOperationException.
+    public void testInfer_ThrowsWhenQueryIsPresent() throws IOException {
+        var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+        try (var service = new AzureAiStudioService(senderFactory, createWithEmptySettings(threadPool))) {
+            webServer.enqueue(new MockResponse().setResponseCode(200).setBody(testChatCompletionResultJson));
+
+            var model = AzureAiStudioChatCompletionModelTests.createModel(
+                "id",
+                getUrl(webServer),
+                AzureAiStudioProvider.OPENAI,
+                AzureAiStudioEndpointType.TOKEN,
+                "apikey"
+            );
+
+            // fixed: raw PlainActionFuture — restore the type parameter; infer reports InferenceServiceResults
+            PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+            UnsupportedOperationException exception = expectThrows(
+                UnsupportedOperationException.class,
+                () -> service.infer(
+                    model,
+                    "should throw",
+                    List.of("abc"),
+                    new HashMap<>(),
+                    InputType.INGEST,
+                    InferenceAction.Request.DEFAULT_TIMEOUT,
+                    listener
+                )
+            );
+
+            assertThat(exception.getMessage(), is("Azure AI Studio service does not support inference with query input"));
+        }
+    }
+
+    // Happy-path infer with a chat-completion model: the canned response should be
+    // parsed into a single ChatCompletionResults entry.
+    public void testInfer_WithChatCompletionModel() throws IOException {
+        var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+        try (var service = new AzureAiStudioService(senderFactory, createWithEmptySettings(threadPool))) {
+            webServer.enqueue(new MockResponse().setResponseCode(200).setBody(testChatCompletionResultJson));
+
+            var model = AzureAiStudioChatCompletionModelTests.createModel(
+                "id",
+                getUrl(webServer),
+                AzureAiStudioProvider.OPENAI,
+                AzureAiStudioEndpointType.TOKEN,
+                "apikey"
+            );
+
+            // fixed: raw PlainActionFuture — restore the type parameter; infer reports InferenceServiceResults
+            PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+            service.infer(
+                model,
+                null,
+                List.of("abc"),
+                new HashMap<>(),
+                InputType.INGEST,
+                InferenceAction.Request.DEFAULT_TIMEOUT,
+                listener
+            );
+
+            var result = listener.actionGet(TIMEOUT);
+            assertThat(result, CoreMatchers.instanceOf(ChatCompletionResults.class));
+
+            var completionResults = (ChatCompletionResults) result;
+            assertThat(completionResults.getResults().size(), is(1));
+            assertThat(completionResults.getResults().get(0).content(), is("test completion content"));
+        }
+    }
+
+    // A 401 response must surface as an ElasticsearchException whose message includes
+    // both the authentication-failure note and the provider's error message.
+    public void testInfer_UnauthorisedResponse() throws IOException {
+        var senderFactory = HttpRequestSenderTests.createSenderFactory(threadPool, clientManager);
+
+        try (var service = new AzureAiStudioService(senderFactory, createWithEmptySettings(threadPool))) {
+
+            String responseJson = """
+                {
+                    "error": {
+                        "message": "Incorrect API key provided:",
+                        "type": "invalid_request_error",
+                        "param": null,
+                        "code": "invalid_api_key"
+                    }
+                }
+                """;
+            webServer.enqueue(new MockResponse().setResponseCode(401).setBody(responseJson));
+
+            var model = AzureAiStudioEmbeddingsModelTests.createModel(
+                "id",
+                getUrl(webServer),
+                AzureAiStudioProvider.OPENAI,
+                AzureAiStudioEndpointType.TOKEN,
+                "apikey",
+                null,
+                false,
+                null,
+                null,
+                "user",
+                null
+            );
+            // fixed: raw PlainActionFuture — restore the type parameter; infer reports InferenceServiceResults
+            PlainActionFuture<InferenceServiceResults> listener = new PlainActionFuture<>();
+            service.infer(
+                model,
+                null,
+                List.of("abc"),
+                new HashMap<>(),
+                InputType.INGEST,
+                InferenceAction.Request.DEFAULT_TIMEOUT,
+                listener
+            );
+
+            var error = expectThrows(ElasticsearchException.class, () -> listener.actionGet(TIMEOUT));
+            assertThat(error.getMessage(), containsString("Received an authentication error status code for request"));
+            assertThat(error.getMessage(), containsString("Error message: [Incorrect API key provided:]"));
+            assertThat(webServer.requests(), hasSize(1));
+        }
+    }
+
+ // ----------------------------------------------------------------
+
+    // Builds a service backed by a mocked sender factory; callers are responsible for closing it.
+    private AzureAiStudioService createService() {
+        var mockedSenderFactory = mock(HttpRequestSender.Factory.class);
+        return new AzureAiStudioService(mockedSenderFactory, createWithEmptySettings(threadPool));
+    }
+
+    /**
+     * Builds a request-style config map: service settings and secret settings are merged
+     * under {@code service_settings}, task settings go under {@code task_settings}.
+     * Fixed: raw {@code Map} types (lost in the patch) restored to {@code Map<String, Object>}.
+     */
+    private Map<String, Object> getRequestConfigMap(
+        Map<String, Object> serviceSettings,
+        Map<String, Object> taskSettings,
+        Map<String, Object> secretSettings
+    ) {
+        var builtServiceSettings = new HashMap<String, Object>();
+        builtServiceSettings.putAll(serviceSettings);
+        builtServiceSettings.putAll(secretSettings);
+
+        return new HashMap<>(
+            Map.of(ModelConfigurations.SERVICE_SETTINGS, builtServiceSettings, ModelConfigurations.TASK_SETTINGS, taskSettings)
+        );
+    }
+
+    // Pair of persisted config and secrets maps, as handed to parsePersistedConfig*.
+    // Fixed: raw Map components restored to Map<String, Object>.
+    // NOTE(review): "Peristed" is a typo for "Persisted"; name kept because the
+    // getPersistedConfigMap helper below returns this type.
+    private record PeristedConfigRecord(Map<String, Object> config, Map<String, Object> secrets) {}
+
+ private PeristedConfigRecord getPersistedConfigMap(
+ Map serviceSettings,
+ Map taskSettings,
+ Map