diff --git a/docs/35.0.0/api-reference/api-reference.md b/docs/35.0.0/api-reference/api-reference.md new file mode 100644 index 0000000000..dd4a4ab638 --- /dev/null +++ b/docs/35.0.0/api-reference/api-reference.md @@ -0,0 +1,44 @@ +--- +id: api-reference +title: API reference +sidebar_label: Overview +--- + + + + +This topic is an index to the Apache Druid API documentation. + +## HTTP APIs +* [Druid SQL queries](./sql-api.md) to submit SQL queries using the Druid SQL API. +* [SQL-based ingestion](./sql-ingestion-api.md) to submit SQL-based batch ingestion requests. +* [JSON querying](./json-querying-api.md) to submit JSON-based native queries. +* [Tasks](./tasks-api.md) to manage data ingestion operations. +* [Supervisors](./supervisor-api.md) to manage supervisors for data ingestion lifecycle and data processing. +* [Retention rules](./retention-rules-api.md) to define and manage data retention rules across datasources. +* [Data management](./data-management-api.md) to manage data segments. +* [Automatic compaction](./automatic-compaction-api.md) to optimize segment sizes after ingestion. +* [Lookups](./lookups-api.md) to manage and modify key-value datasources. +* [Service status](./service-status-api.md) to monitor components within the Druid cluster. +* [Dynamic configuration](./dynamic-configuration-api.md) to configure the behavior of the Coordinator and Overlord processes. +* [Legacy metadata](./legacy-metadata-api.md) to retrieve datasource metadata. + +## Java APIs +* [SQL JDBC driver](./sql-jdbc.md) to connect to Druid and make Druid SQL queries using the Avatica JDBC driver. \ No newline at end of file diff --git a/docs/35.0.0/api-reference/automatic-compaction-api.md b/docs/35.0.0/api-reference/automatic-compaction-api.md new file mode 100644 index 0000000000..f3744a45f0 --- /dev/null +++ b/docs/35.0.0/api-reference/automatic-compaction-api.md @@ -0,0 +1,1592 @@ +--- +id: automatic-compaction-api +title: Automatic compaction API +sidebar_label: Automatic compaction +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + + +This topic describes the status and configuration API endpoints for [automatic compaction using Coordinator duties](../data-management/automatic-compaction.md#auto-compaction-using-coordinator-duties) in Apache Druid. You can configure automatic compaction in the Druid web console or API. + +:::info[Experimental] + +Instead of the automatic compaction API, you can use the supervisor API to submit auto-compaction jobs using compaction supervisors. For more information, see [Auto-compaction using compaction supervisors](../data-management/automatic-compaction.md#auto-compaction-using-compaction-supervisors). + +::: + +In this topic, `http://ROUTER_IP:ROUTER_PORT` is a placeholder for your Router service address and port. Replace it with the information for your deployment. For example, use `http://localhost:8888` for quickstart deployments. + +## Manage automatic compaction + +### Create or update automatic compaction configuration + +Creates or updates the automatic compaction configuration for a datasource. Pass the automatic compaction as a JSON object in the request body. + +The automatic compaction configuration requires only the `dataSource` property. Druid fills all other properties with default values if not specified. See [Automatic compaction dynamic configuration](../configuration/index.md#automatic-compaction-dynamic-configuration) for configuration details. 
+ +Note that this endpoint returns an HTTP `200 OK` message code even if the datasource name does not exist. + +#### URL + +`POST` `/druid/coordinator/v1/config/compaction` + +#### Responses + + + + + + +*Successfully submitted auto compaction configuration* + + + + +--- +#### Sample request + +The following example creates an automatic compaction configuration for the datasource `wikipedia_hour`, which was ingested with `HOUR` segment granularity. This automatic compaction configuration performs compaction on `wikipedia_hour`, resulting in compacted segments that represent a day interval of data. + +In this example: + +* `wikipedia_hour` is a datasource with `HOUR` segment granularity. +* `skipOffsetFromLatest` is set to `PT0S`, meaning that no data is skipped. +* `partitionsSpec` is set to the default `dynamic`, allowing Druid to dynamically determine the optimal partitioning strategy. +* `type` is set to `index_parallel`, meaning that parallel indexing is used. +* `segmentGranularity` is set to `DAY`, meaning that each compacted segment is a day of data. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction"\ +--header 'Content-Type: application/json' \ +--data '{ + "dataSource": "wikipedia_hour", + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "partitionsSpec": { + "type": "dynamic" + }, + "type": "index_parallel" + }, + "granularitySpec": { + "segmentGranularity": "DAY" + } +}' +``` + + + + + +```HTTP +POST /druid/coordinator/v1/config/compaction HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 281 + +{ + "dataSource": "wikipedia_hour", + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "partitionsSpec": { + "type": "dynamic" + }, + "type": "index_parallel" + }, + "granularitySpec": { + "segmentGranularity": "DAY" + } +} +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + + +### Remove automatic compaction configuration + +Removes the automatic compaction configuration for a datasource. This updates the compaction status of the datasource to "Not enabled." + +#### URL + +`DELETE` `/druid/coordinator/v1/config/compaction/{dataSource}` + +#### Responses + + + + + + +*Successfully deleted automatic compaction configuration* + + + + + +*Datasource does not have automatic compaction or invalid datasource name* + + + + +--- + + +#### Sample request + + + + + + +```shell +curl --request DELETE "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction/wikipedia_hour" +``` + + + + + +```HTTP +DELETE /druid/coordinator/v1/config/compaction/wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + +### Update capacity for compaction tasks + +:::info +This API is now deprecated. Use [Update cluster-level compaction config](#update-cluster-level-compaction-config) instead. +::: + +Updates the capacity for compaction tasks. The minimum number of compaction tasks is 1 and the maximum is 2147483647. + +Note that while the max compaction tasks can theoretically be set to 2147483647, the practical limit is determined by the available cluster capacity and is capped at 10% of the cluster's total capacity. 
+ +#### URL + +`POST` `/druid/coordinator/v1/config/compaction/taskslots` + +#### Query parameters + +To limit the maximum number of compaction tasks, use the optional query parameters `ratio` and `max`: + +* `ratio` (optional) + * Type: Float + * Default: 0.1 + * Limits the ratio of the total task slots to compaction task slots. +* `max` (optional) + * Type: Int + * Default: 2147483647 + * Limits the maximum number of task slots for compaction tasks. + +#### Responses + + + + + + +*Successfully updated compaction configuration* + + + + + +*Invalid `max` value* + + + + +--- + +#### Sample request + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction/taskslots?ratio=0.2&max=250000" +``` + + + + + +```HTTP +POST /druid/coordinator/v1/config/compaction/taskslots?ratio=0.2&max=250000 HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + +## View automatic compaction configuration + +### Get all automatic compaction configurations + +Retrieves all automatic compaction configurations. Returns a `compactionConfigs` object containing the active automatic compaction configurations of all datasources. + +You can use this endpoint to retrieve `compactionTaskSlotRatio` and `maxCompactionTaskSlots` values for managing resource allocation of compaction tasks. + +#### URL + +`GET` `/druid/coordinator/v1/config/compaction` + +#### Responses + + + + + + +*Successfully retrieved automatic compaction configurations* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/config/compaction HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "compactionConfigs": [ + { + "dataSource": "wikipedia_hour", + "taskPriority": 25, + "inputSegmentSizeBytes": 100000000000000, + "maxRowsPerSegment": null, + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "maxRowsInMemory": null, + "appendableIndexSpec": null, + "maxBytesInMemory": null, + "maxTotalRows": null, + "splitHintSpec": null, + "partitionsSpec": { + "type": "dynamic", + "maxRowsPerSegment": 5000000, + "maxTotalRows": null + }, + "indexSpec": null, + "indexSpecForIntermediatePersists": null, + "maxPendingPersists": null, + "pushTimeout": null, + "segmentWriteOutMediumFactory": null, + "maxNumConcurrentSubTasks": null, + "maxRetry": null, + "taskStatusCheckPeriodMs": null, + "chatHandlerTimeout": null, + "chatHandlerNumRetries": null, + "maxNumSegmentsToMerge": null, + "totalNumMergeTasks": null, + "maxColumnsToMerge": null, + "type": "index_parallel", + "forceGuaranteedRollup": false + }, + "granularitySpec": { + "segmentGranularity": "DAY", + "queryGranularity": null, + "rollup": null + }, + "dimensionsSpec": null, + "metricsSpec": null, + "transformSpec": null, + "ioConfig": null, + "taskContext": null + }, + { + "dataSource": "wikipedia", + "taskPriority": 25, + "inputSegmentSizeBytes": 100000000000000, + "maxRowsPerSegment": null, + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "maxRowsInMemory": null, + "appendableIndexSpec": null, + "maxBytesInMemory": null, + "maxTotalRows": null, + "splitHintSpec": null, + "partitionsSpec": { + "type": "dynamic", + "maxRowsPerSegment": 5000000, + "maxTotalRows": null + }, + "indexSpec": null, + "indexSpecForIntermediatePersists": null, + "maxPendingPersists": null, + "pushTimeout": null, + "segmentWriteOutMediumFactory": null, + "maxNumConcurrentSubTasks": null, + "maxRetry": null, + "taskStatusCheckPeriodMs": null, + "chatHandlerTimeout": null, + "chatHandlerNumRetries": null, + "maxNumSegmentsToMerge": null, + "totalNumMergeTasks": null, + "maxColumnsToMerge": null, + "type": "index_parallel", + "forceGuaranteedRollup": false + }, + "granularitySpec": { + "segmentGranularity": "DAY", + "queryGranularity": null, + "rollup": null + }, + "dimensionsSpec": null, + "metricsSpec": null, + "transformSpec": null, + "ioConfig": null, + "taskContext": null + } + ], + "compactionTaskSlotRatio": 0.1, + "maxCompactionTaskSlots": 2147483647, + +} +``` +
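+
+To scan a large response for just the configured datasources and the current task slot settings, you can filter it client-side. A minimal sketch, assuming the `jq` utility is available on the machine issuing the request:
+
+```shell
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction" \
+  | jq '{dataSources: [.compactionConfigs[].dataSource], compactionTaskSlotRatio, maxCompactionTaskSlots}'
+```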
+ +### Get automatic compaction configuration + +Retrieves the automatic compaction configuration for a datasource. + +#### URL + +`GET` `/druid/coordinator/v1/config/compaction/{dataSource}` + +#### Responses + + + + + + +*Successfully retrieved configuration for datasource* + + + + + +*Invalid datasource or datasource does not have automatic compaction enabled* + + + + +--- + +#### Sample request + +The following example retrieves the automatic compaction configuration for datasource `wikipedia_hour`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction/wikipedia_hour" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/config/compaction/wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "dataSource": "wikipedia_hour", + "taskPriority": 25, + "inputSegmentSizeBytes": 100000000000000, + "maxRowsPerSegment": null, + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "maxRowsInMemory": null, + "appendableIndexSpec": null, + "maxBytesInMemory": null, + "maxTotalRows": null, + "splitHintSpec": null, + "partitionsSpec": { + "type": "dynamic", + "maxRowsPerSegment": 5000000, + "maxTotalRows": null + }, + "indexSpec": null, + "indexSpecForIntermediatePersists": null, + "maxPendingPersists": null, + "pushTimeout": null, + "segmentWriteOutMediumFactory": null, + "maxNumConcurrentSubTasks": null, + "maxRetry": null, + "taskStatusCheckPeriodMs": null, + "chatHandlerTimeout": null, + "chatHandlerNumRetries": null, + "maxNumSegmentsToMerge": null, + "totalNumMergeTasks": null, + "maxColumnsToMerge": null, + "type": "index_parallel", + "forceGuaranteedRollup": false + }, + "granularitySpec": { + "segmentGranularity": "DAY", + "queryGranularity": null, + "rollup": null + }, + "dimensionsSpec": null, + "metricsSpec": null, + "transformSpec": null, + "ioConfig": null, + "taskContext": null +} +``` +
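+
+Because a datasource without automatic compaction returns a 404, the HTTP status code alone is enough to check whether auto-compaction is enabled. A minimal sketch, assuming the placeholders are replaced with your Router address:
+
+```shell
+# Prints 200 if wikipedia_hour has an auto-compaction configuration, 404 otherwise.
+curl -s -o /dev/null -w "%{http_code}\n" \
+  "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction/wikipedia_hour"
+```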
+ +### Get automatic compaction configuration history + +Retrieves the history of the automatic compaction configuration for a datasource. Returns an empty list if the datasource does not exist or there is no compaction history for the datasource. + +The response contains a list of objects with the following keys: +* `globalConfig`: A JSON object containing automatic compaction configuration that applies to the entire cluster. +* `compactionConfig`: A JSON object containing the automatic compaction configuration for the datasource. +* `auditInfo`: A JSON object containing information about the change made, such as `author`, `comment` or `ip`. +* `auditTime`: The date and time when the change was made. + +#### URL + +`GET` `/druid/coordinator/v1/config/compaction/{dataSource}/history` + +#### Query parameters +* `interval` (optional) + * Type: ISO-8601 + * Limits the results within a specified interval. Use `/` as the delimiter for the interval string. +* `count` (optional) + * Type: Int + * Limits the number of results. + +#### Responses + + + + + + +*Successfully retrieved configuration history* + + + + + +*Invalid `count` value* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction/wikipedia_hour/history" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/config/compaction/wikipedia_hour/history HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +[ + { + "globalConfig": { + "compactionTaskSlotRatio": 0.1, + "maxCompactionTaskSlots": 2147483647, + "compactionPolicy": { + "type": "newestSegmentFirst", + "priorityDatasource": "wikipedia" + }, + "useSupervisors": true, + "engine": "native" + }, + "compactionConfig": { + "dataSource": "wikipedia_hour", + "taskPriority": 25, + "inputSegmentSizeBytes": 100000000000000, + "maxRowsPerSegment": null, + "skipOffsetFromLatest": "P1D", + "tuningConfig": null, + "granularitySpec": { + "segmentGranularity": "DAY", + "queryGranularity": null, + "rollup": null + }, + "dimensionsSpec": null, + "metricsSpec": null, + "transformSpec": null, + "ioConfig": null, + "taskContext": null + }, + "auditInfo": { + "author": "", + "comment": "", + "ip": "127.0.0.1" + }, + "auditTime": "2023-07-31T18:15:19.302Z" + }, + { + "globalConfig": { + "compactionTaskSlotRatio": 0.1, + "maxCompactionTaskSlots": 2147483647, + "compactionPolicy": { + "type": "newestSegmentFirst" + }, + "useSupervisors": false, + "engine": "native" + }, + "compactionConfig": { + "dataSource": "wikipedia_hour", + "taskPriority": 25, + "inputSegmentSizeBytes": 100000000000000, + "maxRowsPerSegment": null, + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "maxRowsInMemory": null, + "appendableIndexSpec": null, + "maxBytesInMemory": null, + "maxTotalRows": null, + "splitHintSpec": null, + "partitionsSpec": { + "type": "dynamic", + "maxRowsPerSegment": 5000000, + "maxTotalRows": null + }, + "indexSpec": null, + "indexSpecForIntermediatePersists": null, + "maxPendingPersists": null, + "pushTimeout": null, + "segmentWriteOutMediumFactory": null, + "maxNumConcurrentSubTasks": null, + "maxRetry": null, + "taskStatusCheckPeriodMs": null, + "chatHandlerTimeout": null, + "chatHandlerNumRetries": null, + "maxNumSegmentsToMerge": null, + "totalNumMergeTasks": null, + "maxColumnsToMerge": null, + "type": "index_parallel", + "forceGuaranteedRollup": false + }, + "granularitySpec": { + "segmentGranularity": "DAY", + "queryGranularity": null, + "rollup": null + }, + "dimensionsSpec": null, + "metricsSpec": null, + "transformSpec": null, + "ioConfig": null, + "taskContext": null + }, + "auditInfo": { + "author": "", + "comment": "", + "ip": "127.0.0.1" + }, + "auditTime": "2023-07-31T18:16:16.362Z" + } +] +``` +
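+
+To see only the most recent change rather than the full history, you can sort the returned array by `auditTime` client-side. A minimal sketch, assuming `jq` is available:
+
+```shell
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/compaction/wikipedia_hour/history" \
+  | jq 'max_by(.auditTime) | {auditTime, auditInfo, compactionConfig}'
+```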
+ +## View automatic compaction status + +### Get segments awaiting compaction + +Returns the total size of segments awaiting compaction for a given datasource. Returns a 404 response if a datasource does not have automatic compaction enabled. + +#### URL + +`GET` `/druid/coordinator/v1/compaction/progress?dataSource={dataSource}` + +#### Query parameter +* `dataSource` (required) + * Type: String + * Name of the datasource for this status information. + +#### Responses + + + + + + +*Successfully retrieved segment size awaiting compaction* + + + + + +*Unknown datasource name or datasource does not have automatic compaction enabled* + + + + +--- + +#### Sample request + +The following example retrieves the remaining segments to be compacted for datasource `wikipedia_hour`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/compaction/progress?dataSource=wikipedia_hour" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/compaction/progress?dataSource=wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "remainingSegmentSize": 7615837 +} +``` +
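+
+Since automatic compaction runs periodically, this endpoint is convenient for polling until a datasource has no eligible data left to compact. A minimal sketch, assuming `jq` is available and a 60-second polling interval is acceptable:
+
+```shell
+while true; do
+  remaining=$(curl -s "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/compaction/progress?dataSource=wikipedia_hour" \
+    | jq -r '.remainingSegmentSize')
+  echo "Bytes awaiting compaction: ${remaining}"
+  [ "${remaining}" = "0" ] && break
+  sleep 60
+done
+```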
+ + +### Get compaction status and statistics + +Retrieves an array of `latestStatus` objects representing the status and statistics from the latest automatic compaction run for all datasources with automatic compaction enabled. + +#### Compaction status response + +The `latestStatus` object has the following properties: +* `dataSource`: Name of the datasource for this status information. +* `scheduleStatus`: Automatic compaction scheduling status. Possible values are `NOT_ENABLED` and `RUNNING`. Returns `RUNNING ` if the datasource has an active automatic compaction configuration submitted. Otherwise, returns `NOT_ENABLED`. +* `bytesAwaitingCompaction`: Total bytes of this datasource waiting to be compacted by the automatic compaction (only consider intervals/segments that are eligible for automatic compaction). +* `bytesCompacted`: Total bytes of this datasource that are already compacted with the spec set in the automatic compaction configuration. +* `bytesSkipped`: Total bytes of this datasource that are skipped (not eligible for automatic compaction) by the automatic compaction. +* `segmentCountAwaitingCompaction`: Total number of segments of this datasource waiting to be compacted by the automatic compaction (only consider intervals/segments that are eligible for automatic compaction). +* `segmentCountCompacted`: Total number of segments of this datasource that are already compacted with the spec set in the automatic compaction configuration. +* `segmentCountSkipped`: Total number of segments of this datasource that are skipped (not eligible for automatic compaction) by the automatic compaction. +* `intervalCountAwaitingCompaction`: Total number of intervals of this datasource waiting to be compacted by the automatic compaction (only consider intervals/segments that are eligible for automatic compaction). +* `intervalCountCompacted`: Total number of intervals of this datasource that are already compacted with the spec set in the automatic compaction configuration. +* `intervalCountSkipped`: Total number of intervals of this datasource that are skipped (not eligible for automatic compaction) by the automatic compaction. + +#### URL + +`GET` `/druid/coordinator/v1/compaction/status` + +#### Query parameters +* `dataSource` (optional) + * Type: String + * Filter the result by name of a specific datasource. + +#### Responses + + + + + + +*Successfully retrieved `latestStatus` object* + + + + +--- +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/compaction/status" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/compaction/status HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "latestStatus": [ + { + "dataSource": "wikipedia_api", + "scheduleStatus": "RUNNING", + "bytesAwaitingCompaction": 0, + "bytesCompacted": 0, + "bytesSkipped": 64133616, + "segmentCountAwaitingCompaction": 0, + "segmentCountCompacted": 0, + "segmentCountSkipped": 8, + "intervalCountAwaitingCompaction": 0, + "intervalCountCompacted": 0, + "intervalCountSkipped": 1 + }, + { + "dataSource": "wikipedia_hour", + "scheduleStatus": "RUNNING", + "bytesAwaitingCompaction": 0, + "bytesCompacted": 5998634, + "bytesSkipped": 0, + "segmentCountAwaitingCompaction": 0, + "segmentCountCompacted": 1, + "segmentCountSkipped": 0, + "intervalCountAwaitingCompaction": 0, + "intervalCountCompacted": 1, + "intervalCountSkipped": 0 + } + ] +} +``` +
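+
+The raw byte counts can be turned into a quick per-datasource summary, for example the percentage of eligible bytes that are already compacted. A minimal sketch, assuming `jq` is available:
+
+```shell
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/compaction/status" \
+  | jq '.latestStatus[] | {
+      dataSource,
+      percentCompacted: (if .bytesCompacted + .bytesAwaitingCompaction > 0
+        then 100 * .bytesCompacted / (.bytesCompacted + .bytesAwaitingCompaction)
+        else null end)
+    }'
+```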
+ +## [Experimental] Unified Compaction APIs + +This section describes the new unified compaction APIs which can be used regardless of whether compaction supervisors are enabled (i.e. `useSupervisors` is `true`) or not in the compaction dynamic config. + +- If compaction supervisors are disabled, the APIs read or write the compaction dynamic config, same as the Coordinator-based compaction APIs above. +- If compaction supervisors are enabled, the APIs read or write the corresponding compaction supervisors. In conjunction with the APIs described below, the supervisor APIs may also be used to read or write the compaction supervisors as they offer greater flexibility and also serve information related to supervisor and task statuses. + +### Update cluster-level compaction config + +Updates cluster-level configuration for compaction tasks which applies to all datasources, unless explicitly overridden in the datasource compaction config. +This includes the following fields: + +|Config|Description|Default value| +|------|-----------|-------------| +|`compactionTaskSlotRatio`|Ratio of number of slots taken up by compaction tasks to the number of total task slots across all workers.|0.1| +|`maxCompactionTaskSlots`|Maximum number of task slots that can be taken up by compaction tasks and sub-tasks. Minimum number of task slots available for compaction is 1. When using MSQ engine or Native engine with range partitioning, a single compaction job occupies more than one task slot. In this case, the minimum is 2 so that at least one compaction job can always run in the cluster.|2147483647 (i.e. total task slots)| +|`compactionPolicy`|Policy to choose intervals for compaction. Currently, the only supported policy is [Newest segment first](#compaction-policy-newestsegmentfirst).|Newest segment first| +|`useSupervisors`|Whether compaction should be run on Overlord using supervisors instead of Coordinator duties.|false| +|`engine`|Engine used for running compaction tasks, unless overridden in the datasource-level compaction config. Possible values are `native` and `msq`. `msq` engine can be used for compaction only if `useSupervisors` is `true`.|`native`| + +#### Compaction policy `newestSegmentFirst` + +|Field|Description|Default value| +|-----|-----------|-------------| +|`type`|This must always be `newestSegmentFirst`|| +|`priorityDatasource`|Datasource to prioritize for compaction. The intervals of this datasource are chosen for compaction before the intervals of any other datasource. 
Within this datasource, the intervals are prioritized based on the chosen compaction policy.|None| + + +#### URL + +`POST` `/druid/indexer/v1/compaction/config/cluster` + +#### Responses + + + + + + +*Successfully updated compaction configuration* + + + + + +*Invalid `max` value* + + + + +--- + +#### Sample request + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/config/cluster" \ +--header 'Content-Type: application/json' \ +--data '{ + "compactionTaskSlotRatio": 0.5, + "maxCompactionTaskSlots": 1500, + "compactionPolicy": { + "type": "newestSegmentFirst", + "priorityDatasource": "wikipedia" + }, + "useSupervisors": true, + "engine": "msq" +}' +``` + + + + + +```HTTP +POST /druid/indexer/v1/compaction/config/cluster HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json + +{ + "compactionTaskSlotRatio": 0.5, + "maxCompactionTaskSlots": 1500, + "compactionPolicy": { + "type": "newestSegmentFirst", + "priorityDatasource": "wikipedia" + }, + "useSupervisors": true, + "engine": "msq" +} +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + +### Get cluster-level compaction config + +Retrieves cluster-level configuration for compaction tasks which applies to all datasources, unless explicitly overridden in the datasource compaction config. +This includes all the fields listed in [Update cluster-level compaction config](#update-cluster-level-compaction-config). + +#### URL + +`GET` `/druid/indexer/v1/compaction/config/cluster` + +#### Responses + + + + + +*Successfully retrieved cluster compaction configuration* + + + + +--- + +#### Sample request + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/config/cluster" +``` + + + + +```HTTP +GET /druid/indexer/v1/compaction/config/cluster HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response +
+ View the response + +```json +{ + "compactionTaskSlotRatio": 0.5, + "maxCompactionTaskSlots": 1500, + "compactionPolicy": { + "type": "newestSegmentFirst", + "priorityDatasource": "wikipedia" + }, + "useSupervisors": true, + "engine": "msq" +} +``` + +
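+
+Whether a `POST` to the update endpoint merges partial payloads is not covered here, so a safe pattern is to read the current cluster-level config, change only the field you need, and submit the whole object back. A minimal sketch that enables compaction supervisors, assuming `jq` is available:
+
+```shell
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/config/cluster" \
+  | jq '.useSupervisors = true' \
+  | curl -s --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/config/cluster" \
+      --header 'Content-Type: application/json' \
+      --data @-
+```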
+ +### Get automatic compaction configurations for all datasources + +Retrieves all datasource compaction configurations. + +#### URL + +`GET` `/druid/indexer/v1/compaction/config/datasources` + +#### Responses + + + + + + +*Successfully retrieved automatic compaction configurations* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/config/datasources" +``` + + + + + +```HTTP +GET /druid/indexer/v1/compaction/config/datasources HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "compactionConfigs": [ + { + "dataSource": "wikipedia_hour", + "taskPriority": 25, + "inputSegmentSizeBytes": 100000000000000, + "maxRowsPerSegment": null, + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "maxRowsInMemory": null, + "appendableIndexSpec": null, + "maxBytesInMemory": null, + "maxTotalRows": null, + "splitHintSpec": null, + "partitionsSpec": { + "type": "dynamic", + "maxRowsPerSegment": 5000000, + "maxTotalRows": null + }, + "indexSpec": null, + "indexSpecForIntermediatePersists": null, + "maxPendingPersists": null, + "pushTimeout": null, + "segmentWriteOutMediumFactory": null, + "maxNumConcurrentSubTasks": null, + "maxRetry": null, + "taskStatusCheckPeriodMs": null, + "chatHandlerTimeout": null, + "chatHandlerNumRetries": null, + "maxNumSegmentsToMerge": null, + "totalNumMergeTasks": null, + "maxColumnsToMerge": null, + "type": "index_parallel", + "forceGuaranteedRollup": false + }, + "granularitySpec": { + "segmentGranularity": "DAY", + "queryGranularity": null, + "rollup": null + }, + "dimensionsSpec": null, + "metricsSpec": null, + "transformSpec": null, + "ioConfig": null, + "taskContext": null + }, + { + "dataSource": "wikipedia", + "taskPriority": 25, + "inputSegmentSizeBytes": 100000000000000, + "maxRowsPerSegment": null, + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "maxRowsInMemory": null, + "appendableIndexSpec": null, + "maxBytesInMemory": null, + "maxTotalRows": null, + "splitHintSpec": null, + "partitionsSpec": { + "type": "dynamic", + "maxRowsPerSegment": 5000000, + "maxTotalRows": null + }, + "indexSpec": null, + "indexSpecForIntermediatePersists": null, + "maxPendingPersists": null, + "pushTimeout": null, + "segmentWriteOutMediumFactory": null, + "maxNumConcurrentSubTasks": null, + "maxRetry": null, + "taskStatusCheckPeriodMs": null, + "chatHandlerTimeout": null, + "chatHandlerNumRetries": null, + "maxNumSegmentsToMerge": null, + "totalNumMergeTasks": null, + "maxColumnsToMerge": null, + "type": "index_parallel", + "forceGuaranteedRollup": false + }, + "granularitySpec": { + "segmentGranularity": "DAY", + "queryGranularity": null, + "rollup": null + }, + "dimensionsSpec": null, + "metricsSpec": null, + "transformSpec": null, + "ioConfig": null, + "taskContext": null + } + ] +} +``` +
+ +### Get automatic compaction configuration for a datasource + +Retrieves the automatic compaction configuration for a datasource. + +#### URL + +`GET` `/druid/indexer/v1/compaction/config/datasources/{dataSource}` + +#### Responses + + + + + + +*Successfully retrieved configuration for datasource* + + + + + +*Invalid datasource or datasource does not have automatic compaction enabled* + + + + +--- + +#### Sample request + +The following example retrieves the automatic compaction configuration for datasource `wikipedia_hour`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/config/datasources/wikipedia_hour" +``` + + + + + +```HTTP +GET /druid/indexer/v1/compaction/config/datasources/wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "dataSource": "wikipedia_hour", + "taskPriority": 25, + "inputSegmentSizeBytes": 100000000000000, + "maxRowsPerSegment": null, + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "maxRowsInMemory": null, + "appendableIndexSpec": null, + "maxBytesInMemory": null, + "maxTotalRows": null, + "splitHintSpec": null, + "partitionsSpec": { + "type": "dynamic", + "maxRowsPerSegment": 5000000, + "maxTotalRows": null + }, + "indexSpec": null, + "indexSpecForIntermediatePersists": null, + "maxPendingPersists": null, + "pushTimeout": null, + "segmentWriteOutMediumFactory": null, + "maxNumConcurrentSubTasks": null, + "maxRetry": null, + "taskStatusCheckPeriodMs": null, + "chatHandlerTimeout": null, + "chatHandlerNumRetries": null, + "maxNumSegmentsToMerge": null, + "totalNumMergeTasks": null, + "maxColumnsToMerge": null, + "type": "index_parallel", + "forceGuaranteedRollup": false + }, + "granularitySpec": { + "segmentGranularity": "DAY", + "queryGranularity": null, + "rollup": null + }, + "dimensionsSpec": null, + "metricsSpec": null, + "transformSpec": null, + "ioConfig": null, + "taskContext": null +} +``` +
+ +### Create or update automatic compaction configuration for a datasource + +Creates or updates the automatic compaction configuration for a datasource. Pass the automatic compaction as a JSON object in the request body. + +The automatic compaction configuration requires only the `dataSource` property. Druid fills all other properties with default values if not specified. See [Automatic compaction dynamic configuration](../configuration/index.md#automatic-compaction-dynamic-configuration) for configuration details. + +Note that this endpoint returns an HTTP `200 OK` message code even if the datasource name does not exist. + +#### URL + +`POST` `/druid/indexer/v1/compaction/config/datasources/wikipedia_hour` + +#### Responses + + + + + + +*Successfully submitted auto compaction configuration* + + + + +--- +#### Sample request + +The following example creates an automatic compaction configuration for the datasource `wikipedia_hour`, which was ingested with `HOUR` segment granularity. This automatic compaction configuration performs compaction on `wikipedia_hour`, resulting in compacted segments that represent a day interval of data. + +In this example: + +* `wikipedia_hour` is a datasource with `HOUR` segment granularity. +* `skipOffsetFromLatest` is set to `PT0S`, meaning that no data is skipped. +* `partitionsSpec` is set to the default `dynamic`, allowing Druid to dynamically determine the optimal partitioning strategy. +* `type` is set to `index_parallel`, meaning that parallel indexing is used. +* `segmentGranularity` is set to `DAY`, meaning that each compacted segment is a day of data. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/config/datasources/wikipedia_hour"\ +--header 'Content-Type: application/json' \ +--data '{ + "dataSource": "wikipedia_hour", + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "partitionsSpec": { + "type": "dynamic" + }, + "type": "index_parallel" + }, + "granularitySpec": { + "segmentGranularity": "DAY" + } +}' +``` + + + + + +```HTTP +POST /druid/indexer/v1/compaction/config/datasources/wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 281 + +{ + "dataSource": "wikipedia_hour", + "skipOffsetFromLatest": "PT0S", + "tuningConfig": { + "partitionsSpec": { + "type": "dynamic" + }, + "type": "index_parallel" + }, + "granularitySpec": { + "segmentGranularity": "DAY" + } +} +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + + +### Delete automatic compaction configuration for a datasource + +Removes the automatic compaction configuration for a datasource. This updates the compaction status of the datasource to "Not enabled." + +#### URL + +`DELETE` `/druid/indexer/v1/compaction/config/datasources/{dataSource}` + +#### Responses + + + + + + +*Successfully deleted automatic compaction configuration* + + + + + +*Datasource does not have automatic compaction or invalid datasource name* + + + + +--- + + +#### Sample request + + + + + + +```shell +curl --request DELETE "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/config/datasources/wikipedia_hour" +``` + + + + + +```HTTP +DELETE /druid/indexer/v1/compaction/config/wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. 
+ +### Get compaction status for all datasources + +Retrieves an array of `latestStatus` objects representing the status and statistics from the latest automatic compaction run for all the datasources to which the user has read access. +The response payload is in the same format as [Compaction status response](#compaction-status-response). + +#### URL + +`GET` `/druid/indexer/v1/compaction/status/datasources` + +#### Responses + + + + + + +*Successfully retrieved `latestStatus` object* + + + + +--- +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/status/datasources" +``` + + + + + +```HTTP +GET /druid/indexer/v1/compaction/status/datasources HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "latestStatus": [ + { + "dataSource": "wikipedia_api", + "scheduleStatus": "RUNNING", + "bytesAwaitingCompaction": 0, + "bytesCompacted": 0, + "bytesSkipped": 64133616, + "segmentCountAwaitingCompaction": 0, + "segmentCountCompacted": 0, + "segmentCountSkipped": 8, + "intervalCountAwaitingCompaction": 0, + "intervalCountCompacted": 0, + "intervalCountSkipped": 1 + }, + { + "dataSource": "wikipedia_hour", + "scheduleStatus": "RUNNING", + "bytesAwaitingCompaction": 0, + "bytesCompacted": 5998634, + "bytesSkipped": 0, + "segmentCountAwaitingCompaction": 0, + "segmentCountCompacted": 1, + "segmentCountSkipped": 0, + "intervalCountAwaitingCompaction": 0, + "intervalCountCompacted": 1, + "intervalCountSkipped": 0 + } + ] +} +``` +
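+
+To get a single cluster-wide number, such as the total bytes still awaiting compaction across all visible datasources, you can aggregate the response client-side. A minimal sketch, assuming `jq` is available:
+
+```shell
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/status/datasources" \
+  | jq '[.latestStatus[].bytesAwaitingCompaction] | add'
+```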
+ +### Get compaction status for a single datasource + +Retrieves the latest status from the latest automatic compaction run for a datasource. The response payload is in the same format as [Compaction status response](#compaction-status-response) with zero or one entry. + +#### URL + +`GET` `/druid/indexer/v1/compaction/status/datasources/{dataSource}` + +#### Responses + + + + + + +*Successfully retrieved `latestStatus` object* + + + + +--- +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/status/datasources/wikipedia_hour" +``` + + + + + +```HTTP +GET /druid/indexer/v1/compaction/status/datasources/wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "latestStatus": [ + { + "dataSource": "wikipedia_hour", + "scheduleStatus": "RUNNING", + "bytesAwaitingCompaction": 0, + "bytesCompacted": 5998634, + "bytesSkipped": 0, + "segmentCountAwaitingCompaction": 0, + "segmentCountCompacted": 1, + "segmentCountSkipped": 0, + "intervalCountAwaitingCompaction": 0, + "intervalCountCompacted": 1, + "intervalCountSkipped": 0 + } + ] +} +``` +
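+
+Because the `latestStatus` array can contain zero entries for a datasource, a script should handle that case explicitly. A minimal sketch that prints the schedule status or falls back to `NOT_ENABLED`, assuming `jq` is available:
+
+```shell
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/compaction/status/datasources/wikipedia_hour" \
+  | jq -r '.latestStatus[0].scheduleStatus // "NOT_ENABLED"'
+```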
diff --git a/docs/35.0.0/api-reference/data-management-api.md b/docs/35.0.0/api-reference/data-management-api.md new file mode 100644 index 0000000000..fe37c6a814 --- /dev/null +++ b/docs/35.0.0/api-reference/data-management-api.md @@ -0,0 +1,607 @@ +--- +id: data-management-api +title: Data management API +sidebar_label: Data management +--- + + + +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + +This topic describes the data management API endpoints for Apache Druid. +This includes information on how to mark segments as used or unused and delete them from Druid. + +In this topic, `http://ROUTER_IP:ROUTER_PORT` is a placeholder for your Router service address and port. +Replace it with the information for your deployment. +For example, use `http://localhost:8888` for quickstart deployments. + +:::info +- Coordinator APIs for data management are now deprecated. Use new APIs served by the Overlord instead. +- Do not use these APIs while an indexing task or kill task is in progress for the same datasource and interval. +::: + +## Segment management + +You can mark segments as used by sending POST requests to the datasource, but the Coordinator may subsequently mark segments as unused if they meet any configured [drop rules](../operations/rule-configuration.md#drop-rules). +Even if these API requests update segments to used, you still need to configure a [load rule](../operations/rule-configuration.md#load-rules) to load them onto Historical processes. + +When you use these APIs concurrently with an indexing task or a kill task, the behavior is undefined. +Druid terminates some segments and marks others as used. +Furthermore, it is possible that all segments could be unused, yet an indexing task might still be able to read data from these segments and complete successfully. + +All of the following APIs, except [Segment deletion](#segment-deletion) are served by the Overlord as it is the service responsible for performing actions on segment metadata on behalf of indexing tasks. +This makes it the single source of truth for segment metadata, thus ensuring a consistent view across the Druid cluster and allowing the Overlord to cache metadata to improve performance. + +### Segment IDs + +You must provide segment IDs when using many of the endpoints described in this topic. +For information on segment IDs, see [Segment identification](../design/segments.md#segment-identification). +For information on finding segment IDs in the web console, see [Segments](../operations/web-console.md#segments). + +### Mark a single segment unused + +Marks the state of a segment as unused, using the segment ID. +This is a "soft delete" of the segment from Historicals. +To undo this action, [mark the segment used](#mark-a-single-segment-as-used). + +Note that this endpoint returns an HTTP `200 OK` response code even if the segment ID or datasource doesn't exist. +Check the response payload to confirm if any segment was actually updated. + +#### URL + +`DELETE` `/druid/indexer/v1/datasources/{datasource}/segments/{segmentId}` + +#### Header + +The following headers are required for this request: + +```json +Content-Type: application/json +Accept: application/json, text/plain +``` + +#### Responses + + + + + + +*Successfully updated segment* + + + + +--- + +#### Sample request + +The following example updates the segment `wikipedia_hour_2015-09-12T16:00:00.000Z_2015-09-12T17:00:00.000Z_2023-08-10T04:12:03.860Z` from datasource `wikipedia_hour` as `unused`. 
+ + + + + + +```shell +curl --request DELETE "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_hour/segments/wikipedia_hour_2015-09-12T16:00:00.000Z_2015-09-12T17:00:00.000Z_2023-08-10T04:12:03.860Z" \ +--header 'Content-Type: application/json' \ +--header 'Accept: application/json, text/plain' +``` + + + + + +```HTTP +DELETE /druid/indexer/v1/datasources/wikipedia_hour/segments/wikipedia_hour_2015-09-12T16:00:00.000Z_2015-09-12T17:00:00.000Z_2023-08-10T04:12:03.860Z HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Accept: application/json, text/plain +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "segmentStateChanged": true, + "numChangedSegments": 1 +} +``` +
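+
+Because this endpoint returns `200 OK` even for an unknown segment ID or datasource, scripts should check the response payload rather than the status code. A minimal sketch, assuming `jq` is available and `SEGMENT_ID` is a placeholder for a real segment ID:
+
+```shell
+changed=$(curl -s --request DELETE \
+  "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_hour/segments/SEGMENT_ID" \
+  --header 'Content-Type: application/json' \
+  --header 'Accept: application/json, text/plain' \
+  | jq -r '.numChangedSegments')
+if [ "${changed}" != "1" ]; then
+  echo "No segment was marked unused; check the segment ID and datasource name."
+fi
+```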
+ +### Mark a single segment as used + +Marks the state of a segment as used, using the segment ID. + +#### URL + +`POST` `/druid/indexer/v1/datasources/{datasource}/segments/{segmentId}` + +#### Header + +The following headers are required for this request: + +```json +Content-Type: application/json +Accept: application/json, text/plain +``` + +#### Responses + + + + + + +*Successfully updated segments* + + + + +--- + +#### Sample request + +The following example updates the segment with ID `wikipedia_hour_2015-09-12T18:00:00.000Z_2015-09-12T19:00:00.000Z_2023-08-10T04:12:03.860Z` to used. + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_hour/segments/wikipedia_hour_2015-09-12T18:00:00.000Z_2015-09-12T19:00:00.000Z_2023-08-10T04:12:03.860Z" \ +--header 'Content-Type: application/json' \ +--header 'Accept: application/json, text/plain' +``` + + + + + +```HTTP +POST /druid/indexer/v1/datasources/wikipedia_hour/segments/wikipedia_hour_2015-09-12T18:00:00.000Z_2015-09-12T19:00:00.000Z_2023-08-10T04:12:03.860Z HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Accept: application/json, text/plain +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "segmentStateChanged": true, + "numChangedSegments": 1 +} +``` +
+ +### Mark a group of segments unused + +Marks the state of a group of segments as unused, using an array of segment IDs or an interval. +Pass the array of segment IDs or interval as a JSON object in the request body. + +For the interval, specify the start and end times as ISO 8601 strings to identify segments inclusive of the start time and exclusive of the end time. +Optionally, specify an array of segment versions with interval. Druid updates only the segments completely contained +within the specified interval that match the optional list of versions; partially overlapping segments are not affected. + +#### URL + +`POST` `/druid/indexer/v1/datasources/{datasource}/markUnused` + +#### Request body + +The group of segments is sent as a JSON request payload that accepts the following properties: + +|Property|Description|Required|Example| +|--------|-----------|--------|-------| +|`interval`|ISO 8601 segments interval.|Yes, if `segmentIds` is not specified.|`"2015-09-12T03:00:00.000Z/2015-09-12T05:00:00.000Z"`| +|`segmentIds`|List of segment IDs.|Yes, if `interval` is not specified.|`["segmentId1", "segmentId2"]`| +|`versions`|List of segment versions. Must be provided with `interval`.|No.|`["2024-03-14T16:00:04.086Z", ""2024-03-12T16:00:04.086Z"]`| + +#### Responses + + + + + + +*Successfully updated segments* + + + + + +*Invalid datasource name* + + + + + +*Invalid request payload* + + + + +--- + +#### Sample request + +The following example marks two segments from the `wikipedia_hour` datasource unused based on their segment IDs. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_hour/markUnused" \ +--header 'Content-Type: application/json' \ +--data '{ + "segmentIds": [ + "wikipedia_hour_2015-09-12T14:00:00.000Z_2015-09-12T15:00:00.000Z_2023-08-10T04:12:03.860Z", + "wikipedia_hour_2015-09-12T04:00:00.000Z_2015-09-12T05:00:00.000Z_2023-08-10T04:12:03.860Z" + ] +}' +``` + + + + + +```HTTP +POST /druid/indexer/v1/datasources/wikipedia_hour/markUnused HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 230 + +{ + "segmentIds": [ + "wikipedia_hour_2015-09-12T14:00:00.000Z_2015-09-12T15:00:00.000Z_2023-08-10T04:12:03.860Z", + "wikipedia_hour_2015-09-12T04:00:00.000Z_2015-09-12T05:00:00.000Z_2023-08-10T04:12:03.860Z" + ] +} +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "numChangedSegments": 2 +} +``` +
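+
+The sample above marks segments by ID. To mark segments by time interval instead, pass the `interval` property described in the request body table; a minimal sketch using the example interval shown there:
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_hour/markUnused" \
+--header 'Content-Type: application/json' \
+--data '{
+  "interval": "2015-09-12T03:00:00.000Z/2015-09-12T05:00:00.000Z"
+}'
+```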
+ +### Mark a group of segments used + +Marks the state of a group of segments as used, using an array of segment IDs or an interval. +Pass the array of segment IDs or interval as a JSON object in the request body. + +For the interval, specify the start and end times as ISO 8601 strings to identify segments inclusive of the start time and exclusive of the end time. +Optionally, specify an array of segment versions with interval. Druid updates only the segments completely contained +within the specified interval that match the optional list of versions; partially overlapping segments are not affected. + +#### URL + +`POST` `/druid/indexer/v1/datasources/{datasource}/markUsed` + +#### Request body + +The group of segments is sent as a JSON request payload that accepts the following properties: + +|Property|Description|Required|Example| +|--------|-----------|--------|-------| +|`interval`|ISO 8601 segments interval.|Yes, if `segmentIds` is not specified.|`"2015-09-12T03:00:00.000Z/2015-09-12T05:00:00.000Z"`| +|`segmentIds`|List of segment IDs.|Yes, if `interval` is not specified.|`["segmentId1", "segmentId2"]`| +|`versions`|List of segment versions. Must be provided with `interval`.|No.|`["2024-03-14T16:00:04.086Z", ""2024-03-12T16:00:04.086Z"]`| + +#### Responses + + + + + + +*Successfully updated segments* + + + + + +*Invalid datasource name* + + + + + +*Invalid request payload* + + + + +--- + +#### Sample request + +The following example marks two segments from the `wikipedia_hour` datasource used based on their segment IDs. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_hour/markUsed" \ +--header 'Content-Type: application/json' \ +--data '{ + "segmentIds": [ + "wikipedia_hour_2015-09-12T14:00:00.000Z_2015-09-12T15:00:00.000Z_2023-08-10T04:12:03.860Z", + "wikipedia_hour_2015-09-12T04:00:00.000Z_2015-09-12T05:00:00.000Z_2023-08-10T04:12:03.860Z" + ] +}' +``` + + + + + +```HTTP +POST /druid/indexer/v1/datasources/wikipedia_hour/markUsed HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 230 + +{ + "segmentIds": [ + "wikipedia_hour_2015-09-12T14:00:00.000Z_2015-09-12T15:00:00.000Z_2023-08-10T04:12:03.860Z", + "wikipedia_hour_2015-09-12T04:00:00.000Z_2015-09-12T05:00:00.000Z_2023-08-10T04:12:03.860Z" + ] +} +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "numChangedSegments": 2 +} +``` +
+ +### Mark all segments unused + +Marks the state of all segments of a datasource as unused. +This action performs a "soft delete" of the segments from Historicals. + +Note that this endpoint returns an HTTP `200 OK` response code even if the datasource doesn't exist. +Check the response payload to confirm if any segment was actually updated. + +#### URL + +`DELETE` `/druid/indexer/v1/datasources/{datasource}` + +#### Responses + + + + + + +*Successfully updated segments* + + + + +--- + +#### Sample request + + + + + + +```shell +curl --request DELETE "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_hour" +``` + + + + + +```HTTP +DELETE /druid/indexer/v1/datasources/wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "numChangedSegments": 24 +} +``` +
+ +### Mark all non-overshadowed segments used + +Marks the state of all unused segments of a datasource as used given that they are not already overshadowed by other segments. +The endpoint returns the number of changed segments. + +Note that this endpoint returns an HTTP `200 OK` response code even if the datasource doesn't exist. +Check the response payload to get the number of segments actually updated. + +#### URL + +`POST` `/druid/indexer/v1/datasources/{datasource}` + +#### Header + +The following headers are required for this request: + +```json +Content-Type: application/json +Accept: application/json, text/plain +``` + +#### Responses + + + + + + +*Successfully updated segments* + + + + +--- + +#### Sample request + +The following example updates all unused segments of `wikipedia_hour` to used. +`wikipedia_hour` contains one unused segment eligible to be marked as used. + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_hour" \ +--header 'Content-Type: application/json' \ +--header 'Accept: application/json, text/plain' +``` + + + + + +```HTTP +POST /druid/indexer/v1/datasources/wikipedia_hour HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Accept: application/json, text/plain +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "numChangedSegments": 1 +} +``` +
+ +## Segment deletion + +### Permanently delete segments + +The DELETE endpoint sends a [kill task](../ingestion/tasks.md) for a given interval and datasource. The interval value is an ISO 8601 string delimited by `_`. This request permanently deletes all metadata for unused segments and removes them from deep storage. + +Note that this endpoint returns an HTTP `200 OK` response code even if the datasource doesn't exist. + +This endpoint supersedes the deprecated endpoint: `DELETE /druid/coordinator/v1/datasources/{datasource}?kill=true&interval={interval}` + +#### URL + +`DELETE` `/druid/coordinator/v1/datasources/{datasource}/intervals/{interval}` + +#### Responses + + + + + + +*Successfully sent kill task* + + + + +--- + +#### Sample request + +The following example sends a kill task to permanently delete segments in the datasource `wikipedia_hour` from the interval `2015-09-12` to `2015-09-13`. + + + + + + +```shell +curl --request DELETE "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/datasources/wikipedia_hour/intervals/2015-09-12_2015-09-13" +``` + + + + + +```HTTP +DELETE /druid/coordinator/v1/datasources/wikipedia_hour/intervals/2015-09-12_2015-09-13 HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` and an empty response body. diff --git a/docs/35.0.0/api-reference/dynamic-configuration-api.md b/docs/35.0.0/api-reference/dynamic-configuration-api.md new file mode 100644 index 0000000000..cad61e4b88 --- /dev/null +++ b/docs/35.0.0/api-reference/dynamic-configuration-api.md @@ -0,0 +1,665 @@ +--- +id: dynamic-configuration-api +title: Dynamic configuration API +sidebar_label: Dynamic configuration +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + + +This document describes the API endpoints to retrieve and manage dynamic configurations for the [Coordinator](../design/coordinator.md) and [Overlord](../design/overlord.md) in Apache Druid. + +In this topic, `http://ROUTER_IP:ROUTER_PORT` is a placeholder for your Router service address and port. +Replace it with the information for your deployment. +For example, use `http://localhost:8888` for quickstart deployments. + +## Coordinator dynamic configuration + +The Coordinator has dynamic configurations to tune certain behavior on the fly, without requiring a service restart. +For information on the supported properties, see [Coordinator dynamic configuration](../configuration/index.md#dynamic-configuration). + +### Get dynamic configuration + +Retrieves the current Coordinator dynamic configuration. Returns a JSON object with the dynamic configuration properties. + +#### URL + +`GET` `/druid/coordinator/v1/config` + +#### Responses + + + + + + +*Successfully retrieved dynamic configuration* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/config HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+View the response + ```json +{ + "millisToWaitBeforeDeleting": 900000, + "maxSegmentsToMove": 100, + "replicantLifetime": 15, + "replicationThrottleLimit": 500, + "balancerComputeThreads": 1, + "killDataSourceWhitelist": [], + "killPendingSegmentsSkipList": [], + "maxSegmentsInNodeLoadingQueue": 500, + "decommissioningNodes": [], + "decommissioningMaxPercentOfMaxSegmentsToMove": 70, + "pauseCoordination": false, + "replicateAfterLoadTimeout": false, + "maxNonPrimaryReplicantsToLoad": 2147483647, + "useRoundRobinSegmentAssignment": true, + "smartSegmentLoading": true, + "debugDimensions": null, + "turboLoadingNodes": [], + "cloneServers": {} +} +``` + 
+ +### Update dynamic configuration + +Submits a JSON-based dynamic configuration spec to the Coordinator. +For information on the supported properties, see [Dynamic configuration](../configuration/index.md#dynamic-configuration). + +#### URL + +`POST` `/druid/coordinator/v1/config` + +#### Header parameters + +The endpoint supports a set of optional header parameters to populate the `author` and `comment` fields in the configuration history. + +* `X-Druid-Author` + * Type: String + * Author of the configuration change. +* `X-Druid-Comment` + * Type: String + * Description for the update. + +#### Responses + + + + + + +*Successfully updated dynamic configuration* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config" \ +--header 'Content-Type: application/json' \ +--data '{ + "millisToWaitBeforeDeleting": 900000, + "maxSegmentsToMove": 5, + "percentOfSegmentsToConsiderPerMove": 100, + "useBatchedSegmentSampler": true, + "replicantLifetime": 15, + "replicationThrottleLimit": 10, + "balancerComputeThreads": 1, + "emitBalancingStats": true, + "killDataSourceWhitelist": [], + "killPendingSegmentsSkipList": [], + "maxSegmentsInNodeLoadingQueue": 100, + "decommissioningNodes": [], + "decommissioningMaxPercentOfMaxSegmentsToMove": 70, + "pauseCoordination": false, + "replicateAfterLoadTimeout": false, + "maxNonPrimaryReplicantsToLoad": 2147483647, + "useRoundRobinSegmentAssignment": true, + "turboLoadingNodes": [], + "cloneServers": {} +}' +``` + + + + + +```HTTP +POST /druid/coordinator/v1/config HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 683 + +{ + "millisToWaitBeforeDeleting": 900000, + "maxSegmentsToMove": 5, + "percentOfSegmentsToConsiderPerMove": 100, + "useBatchedSegmentSampler": true, + "replicantLifetime": 15, + "replicationThrottleLimit": 10, + "balancerComputeThreads": 1, + "emitBalancingStats": true, + "killDataSourceWhitelist": [], + "killPendingSegmentsSkipList": [], + "maxSegmentsInNodeLoadingQueue": 100, + "decommissioningNodes": [], + "decommissioningMaxPercentOfMaxSegmentsToMove": 70, + "pauseCoordination": false, + "replicateAfterLoadTimeout": false, + "maxNonPrimaryReplicantsToLoad": 2147483647, + "useRoundRobinSegmentAssignment": true, + "turboLoadingNodes": [], + "cloneServers": {} +} +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + +### Get dynamic configuration history + +Retrieves the history of changes to Coordinator dynamic configuration over an interval of time. Returns an empty array if there are no history records available. + +#### URL + +`GET` `/druid/coordinator/v1/config/history` + +#### Query parameters + +The endpoint supports a set of optional query parameters to filter results. + +* `interval` + * Type: String + * Limit the results to the specified time interval in ISO 8601 format delimited with `/`. For example, `2023-07-13/2023-07-19`. The default interval is one week. You can change this period by setting `druid.audit.manager.auditHistoryMillis` in the `runtime.properties` file for the Coordinator. + +* `count` + * Type: Integer + * Limit the number of results to the last `n` entries. + +#### Responses + + + + + + +*Successfully retrieved history* + + + + + +--- + +#### Sample request + +The following example retrieves the dynamic configuration history between `2022-07-13` and `2024-07-19`. The response is limited to 10 entries. 
+ + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/config/history?interval=2022-07-13%2F2024-07-19&count=10" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/config/history?interval=2022-07-13/2024-07-19&count=10 HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response
+
+```json
+[
+  {
+    "key": "coordinator.config",
+    "type": "coordinator.config",
+    "auditInfo": {
+      "author": "",
+      "comment": "",
+      "ip": "127.0.0.1"
+    },
+    "payload": "{\"millisToWaitBeforeDeleting\":900000,\"maxSegmentsToMove\":5,\"replicantLifetime\":15,\"replicationThrottleLimit\":10,\"balancerComputeThreads\":1,\"killDataSourceWhitelist\":[],\"killPendingSegmentsSkipList\":[],\"maxSegmentsInNodeLoadingQueue\":100,\"decommissioningNodes\":[],\"decommissioningMaxPercentOfMaxSegmentsToMove\":70,\"pauseCoordination\":false,\"replicateAfterLoadTimeout\":false,\"maxNonPrimaryReplicantsToLoad\":2147483647,\"useRoundRobinSegmentAssignment\":true,\"smartSegmentLoading\":true,\"debugDimensions\":null}",
+    "auditTime": "2023-10-03T20:59:51.622Z"
+  }
+]
+```
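+
+The `payload` field in each history entry is itself a JSON-encoded string. If you want to inspect a configuration change directly, you can decode that field on the client. The following is a minimal sketch only; it assumes a quickstart Router at `localhost:8888` and that `jq` is installed:
+
+```shell
+# Fetch the most recent Coordinator dynamic configuration change and
+# decode its JSON-encoded `payload` field.
+# Assumes jq is installed and the Router runs at localhost:8888 (quickstart).
+curl -s "http://localhost:8888/druid/coordinator/v1/config/history?count=1" \
+  | jq -r '.[0].payload | fromjson'
+```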
+ +## Overlord dynamic configuration + +The Overlord has dynamic configurations to tune how Druid assigns tasks to workers. +For information on the supported properties, see [Overlord dynamic configuration](../configuration/index.md#overlord-dynamic-configuration). + +### Get dynamic configuration + +Retrieves the current Overlord dynamic configuration. +Returns a JSON object with the dynamic configuration properties. +Returns an empty response body if there is no current Overlord dynamic configuration. + +#### URL + +`GET` `/druid/indexer/v1/worker` + +#### Responses + + + + + + +*Successfully retrieved dynamic configuration* + + + + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/worker" +``` + + + + + +```HTTP +GET /druid/indexer/v1/worker HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "type": "default", + "selectStrategy": { + "type": "fillCapacityWithCategorySpec", + "workerCategorySpec": { + "categoryMap": {}, + "strong": true + } + }, + "autoScaler": null +} +``` + +
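+
+The response above uses the `fillCapacityWithCategorySpec` worker select strategy. You can switch strategies by submitting a new spec to the update endpoint described in the next section. As an illustration only, the following sketch posts a minimal spec that uses the `equalDistribution` strategy; the quickstart Router address is an assumption:
+
+```shell
+# Sketch: set the Overlord worker select strategy to equalDistribution.
+# Assumes a quickstart deployment with the Router at localhost:8888.
+curl "http://localhost:8888/druid/indexer/v1/worker" \
+--header 'Content-Type: application/json' \
+--data '{
+  "type": "default",
+  "selectStrategy": { "type": "equalDistribution" },
+  "autoScaler": null
+}'
+```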
+ +### Update dynamic configuration + +Submits a JSON-based dynamic configuration spec to the Overlord. +For information on the supported properties, see [Overlord dynamic configuration](../configuration/index.md#overlord-dynamic-configuration). + +#### URL + +`POST` `/druid/indexer/v1/worker` + +#### Header parameters + +The endpoint supports a set of optional header parameters to populate the `author` and `comment` fields in the configuration history. + +* `X-Druid-Author` + * Type: String + * Author of the configuration change. +* `X-Druid-Comment` + * Type: String + * Description for the update. + +#### Responses + + + + + + +*Successfully updated dynamic configuration* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/worker" \ +--header 'Content-Type: application/json' \ +--data '{ + "type": "default", + "selectStrategy": { + "type": "fillCapacityWithCategorySpec", + "workerCategorySpec": { + "categoryMap": {}, + "strong": true + } + }, + "autoScaler": null +}' +``` + + + + + +```HTTP +POST /druid/indexer/v1/worker HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 196 + +{ + "type": "default", + "selectStrategy": { + "type": "fillCapacityWithCategorySpec", + "workerCategorySpec": { + "categoryMap": {}, + "strong": true + } + }, + "autoScaler": null +} +``` + + + + +#### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + +### Get dynamic configuration history + +Retrieves the history of changes to Overlord dynamic configuration over an interval of time. Returns an empty array if there are no history records available. + +#### URL + +`GET` `/druid/indexer/v1/worker/history` + +#### Query parameters + +The endpoint supports a set of optional query parameters to filter results. + +* `interval` + * Type: String + * Limit the results to the specified time interval in ISO 8601 format delimited with `/`. For example, `2023-07-13/2023-07-19`. The default interval is one week. You can change this period by setting `druid.audit.manager.auditHistoryMillis` in the `runtime.properties` file for the Overlord. + +* `count` + * Type: Integer + * Limit the number of results to the last `n` entries. + +#### Responses + + + + + + +*Successfully retrieved history* + + + + +--- + +#### Sample request + +The following example retrieves the dynamic configuration history between `2022-07-13` and `2024-07-19`. The response is limited to 10 entries. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/worker/history?interval=2022-07-13%2F2024-07-19&count=10" +``` + + + + + +```HTTP +GET /druid/indexer/v1/worker/history?interval=2022-07-13%2F2024-07-19&count=10 HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +[ + { + "key": "worker.config", + "type": "worker.config", + "auditInfo": { + "author": "", + "comment": "", + "ip": "127.0.0.1" + }, + "payload": "{\"type\":\"default\",\"selectStrategy\":{\"type\":\"fillCapacityWithCategorySpec\",\"workerCategorySpec\":{\"categoryMap\":{},\"strong\":true}},\"autoScaler\":null}", + "auditTime": "2023-10-03T21:49:49.991Z" + } +] +``` + +
+
+### Get an array of worker nodes in the cluster
+
+Returns an array of all the worker nodes in the cluster along with their corresponding metadata.
+
+#### URL
+
+`GET` `/druid/indexer/v1/workers`
+
+#### Responses
+
+
+
+
+*Successfully retrieved worker nodes*
+
+
+
+---
+
+#### Sample request
+
+
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/workers"
+```
+
+
+
+
+```HTTP
+GET /druid/indexer/v1/workers HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+#### Sample response
+
+ View the response + +```json +[ + { + "worker": { + "scheme": "http", + "host": "localhost:8091", + "ip": "198.51.100.0", + "capacity": 2, + "version": "0", + "category": "_default_worker_category" + }, + "currCapacityUsed": 0, + "currParallelIndexCapacityUsed": 0, + "availabilityGroups": [], + "runningTasks": [], + "lastCompletedTaskTime": "2023-09-29T19:13:05.505Z", + "blacklistedUntil": null + } +] +``` + +
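+
+Each entry reports the worker's total task `capacity` along with `currCapacityUsed`, so this endpoint is a convenient way to estimate free task slots across the cluster. A minimal sketch, assuming `jq` is installed and a quickstart Router at `localhost:8888`:
+
+```shell
+# Estimate free task slots: capacity minus capacity in use, summed over all workers.
+# Assumes jq is installed and a quickstart Router at localhost:8888.
+curl -s "http://localhost:8888/druid/indexer/v1/workers" \
+  | jq '[.[] | .worker.capacity - .currCapacityUsed] | add'
+```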
+ +### Get scaling events + +Returns Overlord scaling events if autoscaling runners are in use. +Returns an empty response body if there are no Overlord scaling events. + +#### URL + +`GET` `/druid/indexer/v1/scaling` + +#### Responses + + + + + + +*Successfully retrieved scaling events* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/scaling" +``` + + + + + +```HTTP +GET /druid/indexer/v1/scaling HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +A successful request returns a `200 OK` response and an array of scaling events. diff --git a/docs/35.0.0/api-reference/json-querying-api.md b/docs/35.0.0/api-reference/json-querying-api.md new file mode 100644 index 0000000000..5d03ec8b31 --- /dev/null +++ b/docs/35.0.0/api-reference/json-querying-api.md @@ -0,0 +1,925 @@ +--- +id: json-querying-api +title: JSON querying API +sidebar_label: JSON querying +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + + +This topic describes the API endpoints to submit JSON-based [native queries](../querying/querying.md) to Apache Druid. + +In this topic, `http://SERVICE_IP:SERVICE_PORT` is a placeholder for the server address of deployment and the service port. For example, on the quickstart configuration, replace `http://ROUTER_IP:ROUTER_PORT` with `http://localhost:8888`. + + +## Submit a query + +Submits a JSON-based native query. The body of the request is the native query itself. + +Druid supports different types of queries for different use cases. All queries require the following properties: +* `queryType`: A string representing the type of query. Druid supports the following native query types: `timeseries`, `topN`, `groupBy`, `timeBoundaries`, `segmentMetadata`, `datasourceMetadata`, `scan`, and `search`. +* `dataSource`: A string or object defining the source of data to query. The most common value is the name of the datasource to query. For more information, see [Datasources](../querying/datasource.md). + +For additional properties based on your query type or use case, see [available native queries](../querying/querying.md#available-queries). + +### URL + +`POST` `/druid/v2` + +### Query parameters + +* `pretty` (optional) + * Druid returns the response in a pretty-printed format using indentation and line breaks. + +### Responses + + + + + + +*Successfully submitted query* + + + + + +*Error thrown due to bad query. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "A well-defined error code.", + "errorMessage": "A message with additional details about the error.", + "errorClass": "Class of exception that caused this error.", + "host": "The host on which the error occurred." +} +``` +For more information on possible error messages, see [query execution failures](../querying/querying.md#query-execution-failures). + + + + +--- + +### Example query: `topN` + +The following example shows a `topN` query. The query analyzes the `social_media` datasource to return the top five users from the `username` dimension with the highest number of views from the `views` metric. 
+ + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/v2?pretty=null" \ +--header 'Content-Type: application/json' \ +--data '{ + "queryType": "topN", + "dataSource": "social_media", + "dimension": "username", + "threshold": 5, + "metric": "views", + "granularity": "all", + "aggregations": [ + { + "type": "longSum", + "name": "views", + "fieldName": "views" + } + ], + "intervals": [ + "2022-01-01T00:00:00.000/2024-01-01T00:00:00.000" + ] +}' +``` + + + + +```HTTP +POST /druid/v2?pretty=null HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 336 + +{ + "queryType": "topN", + "dataSource": "social_media", + "dimension": "username", + "threshold": 5, + "metric": "views", + "granularity": "all", + "aggregations": [ + { + "type": "longSum", + "name": "views", + "fieldName": "views" + } + ], + "intervals": [ + "2022-01-01T00:00:00.000/2024-01-01T00:00:00.000" + ] +} +``` + + + + +#### Example response: `topN` + +
+ View the response + + ```json +[ + { + "timestamp": "2023-07-03T18:49:54.848Z", + "result": [ + { + "views": 11591218026, + "username": "gus" + }, + { + "views": 11578638578, + "username": "miette" + }, + { + "views": 11561618880, + "username": "leon" + }, + { + "views": 11552609824, + "username": "mia" + }, + { + "views": 11551537517, + "username": "milton" + } + ] + } +] + ``` +
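+
+For longer native queries, it can be convenient to keep the query in a file and reference it from curl rather than inlining the JSON. A minimal sketch, assuming the `topN` query above is saved as `topn_query.json` (a hypothetical file name) and a quickstart Router at `localhost:8888`:
+
+```shell
+# Submit a native query stored in a file.
+# Assumes the topN query above is saved as topn_query.json and the Router
+# runs at localhost:8888 (quickstart).
+curl "http://localhost:8888/druid/v2" \
+--header 'Content-Type: application/json' \
+--data @topn_query.json
+```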
+ +### Example query: `groupBy` + +The following example submits a JSON query of the `groupBy` type to retrieve the `username` with the highest votes to posts ratio from the `social_media` datasource. + +In this query: +* The `upvoteSum` aggregation calculates the sum of the `upvotes` for each user. +* The `postCount` aggregation calculates the sum of posts for each user. +* The `upvoteToPostRatio` is a post-aggregation of the `upvoteSum` and the `postCount`, divided to calculate the ratio. +* The result is sorted based on the `upvoteToPostRatio` in descending order. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/v2" \ +--header 'Content-Type: application/json' \ +--data '{ + "queryType": "groupBy", + "dataSource": "social_media", + "dimensions": ["username"], + "granularity": "all", + "aggregations": [ + { "type": "doubleSum", "name": "upvoteSum", "fieldName": "upvotes" }, + { "type": "count", "name": "postCount", "fieldName": "post_title" } + ], + "postAggregations": [ + { + "type": "arithmetic", + "name": "upvoteToPostRatio", + "fn": "/", + "fields": [ + { "type": "fieldAccess", "name": "upvoteSum", "fieldName": "upvoteSum" }, + { "type": "fieldAccess", "name": "postCount", "fieldName": "postCount" } + ] + } + ], + "intervals": ["2022-01-01T00:00:00.000/2024-01-01T00:00:00.000"], + "limitSpec": { + "type": "default", + "limit": 1, + "columns": [ + { "dimension": "upvoteToPostRatio", "direction": "descending" } + ] + } +}' +``` + + + + + +```HTTP +POST /druid/v2?pretty=null HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 817 + +{ + "queryType": "groupBy", + "dataSource": "social_media", + "dimensions": ["username"], + "granularity": "all", + "aggregations": [ + { "type": "doubleSum", "name": "upvoteSum", "fieldName": "upvotes" }, + { "type": "count", "name": "postCount", "fieldName": "post_title" } + ], + "postAggregations": [ + { + "type": "arithmetic", + "name": "upvoteToPostRatio", + "fn": "/", + "fields": [ + { "type": "fieldAccess", "name": "upvoteSum", "fieldName": "upvoteSum" }, + { "type": "fieldAccess", "name": "postCount", "fieldName": "postCount" } + ] + } + ], + "intervals": ["2022-01-01T00:00:00.000/2024-01-01T00:00:00.000"], + "limitSpec": { + "type": "default", + "limit": 1, + "columns": [ + { "dimension": "upvoteToPostRatio", "direction": "descending" } + ] + } +} +``` + + + + +#### Example response: `groupBy` + +
+ View the response + +```json +[ + { + "version": "v1", + "timestamp": "2022-01-01T00:00:00.000Z", + "event": { + "upvoteSum": 8.0419541E7, + "upvoteToPostRatio": 69.53014661762697, + "postCount": 1156614, + "username": "miette" + } + } +] +``` +
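+
+As a quick sanity check on the post-aggregation, the returned ratio is consistent with the aggregates in the same row: 80,419,541 upvotes divided by 1,156,614 posts is approximately 69.53, which matches the reported `upvoteToPostRatio`.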
+ +## Get segment information for query + +Retrieves an array that contains objects with segment information, including the server locations associated with the query provided in the request body. + +### URL + +`POST` `/druid/v2/candidates` + +### Query parameters + +* `pretty` (optional) + * Druid returns the response in a pretty-printed format using indentation and line breaks. + +### Responses + + + + + + +*Successfully retrieved segment information* + + + + + +*Error thrown due to bad query. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "A well-defined error code.", + "errorMessage": "A message with additional details about the error.", + "errorClass": "Class of exception that caused this error.", + "host": "The host on which the error occurred." +} +``` + +For more information on possible error messages, see [query execution failures](../querying/querying.md#query-execution-failures). + + + + +--- + +### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/v2/candidates" \ +--header 'Content-Type: application/json' \ +--data '{ + "queryType": "topN", + "dataSource": "social_media", + "dimension": "username", + "threshold": 5, + "metric": "views", + "granularity": "all", + "aggregations": [ + { + "type": "longSum", + "name": "views", + "fieldName": "views" + } + ], + "intervals": [ + "2022-01-01T00:00:00.000/2024-01-01T00:00:00.000" + ] +}' +``` + + + + + +```HTTP +POST /druid/v2/candidates HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 336 + +{ + "queryType": "topN", + "dataSource": "social_media", + "dimension": "username", + "threshold": 5, + "metric": "views", + "granularity": "all", + + "aggregations": [ + { + "type": "longSum", + "name": "views", + "fieldName": "views" + } + ], + "intervals": [ + "2020-01-01T00:00:00.000/2024-01-01T00:00:00.000" + ] +} +``` + + + + +### Sample response + +
+ View the response + + ```json +[ + { + "interval": "2023-07-03T18:00:00.000Z/2023-07-03T19:00:00.000Z", + "version": "2023-07-03T18:51:18.905Z", + "partitionNumber": 0, + "size": 21563693, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-03T19:00:00.000Z/2023-07-03T20:00:00.000Z", + "version": "2023-07-03T19:00:00.657Z", + "partitionNumber": 0, + "size": 6057236, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-05T21:00:00.000Z/2023-07-05T22:00:00.000Z", + "version": "2023-07-05T21:09:58.102Z", + "partitionNumber": 0, + "size": 223926186, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-05T21:00:00.000Z/2023-07-05T22:00:00.000Z", + "version": "2023-07-05T21:09:58.102Z", + "partitionNumber": 1, + "size": 20244827, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-05T22:00:00.000Z/2023-07-05T23:00:00.000Z", + "version": "2023-07-05T22:00:00.524Z", + "partitionNumber": 0, + "size": 104628051, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-05T22:00:00.000Z/2023-07-05T23:00:00.000Z", + "version": "2023-07-05T22:00:00.524Z", + "partitionNumber": 1, + "size": 1603995, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-05T23:00:00.000Z/2023-07-06T00:00:00.000Z", + "version": "2023-07-05T23:21:55.242Z", + "partitionNumber": 0, + "size": 181506843, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T00:00:00.000Z/2023-07-06T01:00:00.000Z", + "version": "2023-07-06T00:02:08.498Z", + "partitionNumber": 0, + "size": 9170974, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T00:00:00.000Z/2023-07-06T01:00:00.000Z", + "version": "2023-07-06T00:02:08.498Z", + "partitionNumber": 1, + "size": 23969632, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T01:00:00.000Z/2023-07-06T02:00:00.000Z", + "version": "2023-07-06T01:13:53.982Z", + "partitionNumber": 0, + "size": 599895, + "locations": [ + { + "name": "localhost:8083", + "host": 
"localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T01:00:00.000Z/2023-07-06T02:00:00.000Z", + "version": "2023-07-06T01:13:53.982Z", + "partitionNumber": 1, + "size": 1627041, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T02:00:00.000Z/2023-07-06T03:00:00.000Z", + "version": "2023-07-06T02:55:50.701Z", + "partitionNumber": 0, + "size": 629753, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T02:00:00.000Z/2023-07-06T03:00:00.000Z", + "version": "2023-07-06T02:55:50.701Z", + "partitionNumber": 1, + "size": 1342360, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T04:00:00.000Z/2023-07-06T05:00:00.000Z", + "version": "2023-07-06T04:02:36.562Z", + "partitionNumber": 0, + "size": 2131434, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T05:00:00.000Z/2023-07-06T06:00:00.000Z", + "version": "2023-07-06T05:23:27.856Z", + "partitionNumber": 0, + "size": 797161, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T05:00:00.000Z/2023-07-06T06:00:00.000Z", + "version": "2023-07-06T05:23:27.856Z", + "partitionNumber": 1, + "size": 1176858, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T06:00:00.000Z/2023-07-06T07:00:00.000Z", + "version": "2023-07-06T06:46:34.638Z", + "partitionNumber": 0, + "size": 2148760, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T07:00:00.000Z/2023-07-06T08:00:00.000Z", + "version": "2023-07-06T07:38:28.050Z", + "partitionNumber": 0, + "size": 2040748, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T08:00:00.000Z/2023-07-06T09:00:00.000Z", + "version": "2023-07-06T08:27:31.407Z", + "partitionNumber": 0, + "size": 678723, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T08:00:00.000Z/2023-07-06T09:00:00.000Z", + "version": "2023-07-06T08:27:31.407Z", + 
"partitionNumber": 1, + "size": 1437866, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T10:00:00.000Z/2023-07-06T11:00:00.000Z", + "version": "2023-07-06T10:02:42.079Z", + "partitionNumber": 0, + "size": 1671296, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T11:00:00.000Z/2023-07-06T12:00:00.000Z", + "version": "2023-07-06T11:27:23.902Z", + "partitionNumber": 0, + "size": 574893, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T11:00:00.000Z/2023-07-06T12:00:00.000Z", + "version": "2023-07-06T11:27:23.902Z", + "partitionNumber": 1, + "size": 1427384, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T12:00:00.000Z/2023-07-06T13:00:00.000Z", + "version": "2023-07-06T12:52:00.846Z", + "partitionNumber": 0, + "size": 2115172, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T14:00:00.000Z/2023-07-06T15:00:00.000Z", + "version": "2023-07-06T14:32:33.926Z", + "partitionNumber": 0, + "size": 589108, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T14:00:00.000Z/2023-07-06T15:00:00.000Z", + "version": "2023-07-06T14:32:33.926Z", + "partitionNumber": 1, + "size": 1392649, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T15:00:00.000Z/2023-07-06T16:00:00.000Z", + "version": "2023-07-06T15:53:25.467Z", + "partitionNumber": 0, + "size": 2037851, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T16:00:00.000Z/2023-07-06T17:00:00.000Z", + "version": "2023-07-06T16:02:26.568Z", + "partitionNumber": 0, + "size": 230400650, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": "2023-07-06T16:00:00.000Z/2023-07-06T17:00:00.000Z", + "version": "2023-07-06T16:02:26.568Z", + "partitionNumber": 1, + "size": 38209056, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + }, + { + "interval": 
"2023-07-06T17:00:00.000Z/2023-07-06T18:00:00.000Z", + "version": "2023-07-06T17:00:02.391Z", + "partitionNumber": 0, + "size": 211099463, + "locations": [ + { + "name": "localhost:8083", + "host": "localhost:8083", + "hostAndTlsPort": null, + "maxSize": 300000000000, + "type": "historical", + "tier": "_default_tier", + "priority": 0 + } + ] + } +] + ``` +
diff --git a/docs/35.0.0/api-reference/legacy-metadata-api.md b/docs/35.0.0/api-reference/legacy-metadata-api.md
new file mode 100644
index 0000000000..d22be18a7e
--- /dev/null
+++ b/docs/35.0.0/api-reference/legacy-metadata-api.md
@@ -0,0 +1,344 @@
+---
+id: legacy-metadata-api
+title: Legacy metadata API
+sidebar_label: Legacy metadata
+---
+
+
+
+This document describes the legacy API endpoints to retrieve datasource metadata from Apache Druid. Use the [SQL metadata tables](../querying/sql-metadata-tables.md) to retrieve datasource metadata instead.
+
+## Segment loading
+
+`GET /druid/coordinator/v1/loadstatus`
+
+Returns the percentage of segments actually loaded in the cluster versus segments that should be loaded in the cluster.
+
+`GET /druid/coordinator/v1/loadstatus?simple`
+
+Returns the number of segments left to load until segments that should be loaded in the cluster are available for queries. This does not include segment replication counts.
+
+`GET /druid/coordinator/v1/loadstatus?full`
+
+Returns the number of segments left to load in each tier until segments that should be loaded in the cluster are all available. This includes segment replication counts.
+
+`GET /druid/coordinator/v1/loadstatus?full&computeUsingClusterView`
+
+Returns the number of segments not yet loaded for each tier until all segments loading in the cluster are available.
+The result includes segment replication counts. It also factors in the number of available nodes that are of a service type that can load the segment when computing the number of segments remaining to load.
+A segment is considered fully loaded when:
+- Druid has replicated it the number of times configured in the corresponding load rule.
+- Or the number of replicas for the segment in each tier where it is configured to be replicated equals the available nodes of a service type that are currently allowed to load the segment in the tier.
+
+`GET /druid/coordinator/v1/loadqueue`
+
+Returns the IDs of segments to load and drop for each Historical process.
+
+`GET /druid/coordinator/v1/loadqueue?simple`
+
+Returns the number of segments to load and drop, as well as the total segment load and drop size in bytes for each Historical process.
+
+`GET /druid/coordinator/v1/loadqueue?full`
+
+Returns the serialized JSON of segments to load and drop for each Historical process.
+
+## Segment loading by datasource
+
+Note that all _interval_ query parameters are ISO 8601 strings—for example, 2016-06-27/2016-06-28.
+Also note that these APIs only guarantee that the segments are available at the time of the call.
+Segments can still go missing afterward because of Historical process failures or other reasons.
+
+`GET /druid/coordinator/v1/datasources/{dataSourceName}/loadstatus?forceMetadataRefresh={boolean}&interval={myInterval}`
+
+Returns the percentage of segments actually loaded in the cluster versus segments that should be loaded in the cluster for the given
+datasource over the given interval (or last 2 weeks if interval is not given). `forceMetadataRefresh` is required to be set.
+* Setting `forceMetadataRefresh` to true will force the coordinator to poll latest segment metadata from the metadata store
+(Note: `forceMetadataRefresh=true` refreshes Coordinator's metadata cache of all datasources. 
This can be a heavy operation in terms +of the load on the metadata store but can be necessary to make sure that we verify all the latest segments' load status) +* Setting `forceMetadataRefresh` to false will use the metadata cached on the coordinator from the last force/periodic refresh. +If no used segments are found for the given inputs, this API returns `204 No Content` + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/loadstatus?simple&forceMetadataRefresh={boolean}&interval={myInterval}` + +Returns the number of segments left to load until segments that should be loaded in the cluster are available for the given datasource +over the given interval (or last 2 weeks if interval is not given). This does not include segment replication counts. `forceMetadataRefresh` is required to be set. +* Setting `forceMetadataRefresh` to true will force the coordinator to poll latest segment metadata from the metadata store +(Note: `forceMetadataRefresh=true` refreshes Coordinator's metadata cache of all datasources. This can be a heavy operation in terms +of the load on the metadata store but can be necessary to make sure that we verify all the latest segments' load status) +* Setting `forceMetadataRefresh` to false will use the metadata cached on the coordinator from the last force/periodic refresh. +If no used segments are found for the given inputs, this API returns `204 No Content` + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/loadstatus?full&forceMetadataRefresh={boolean}&interval={myInterval}` + +Returns the number of segments left to load in each tier until segments that should be loaded in the cluster are all available for the given datasource over the given interval (or last 2 weeks if interval is not given). This includes segment replication counts. `forceMetadataRefresh` is required to be set. +* Setting `forceMetadataRefresh` to true will force the coordinator to poll latest segment metadata from the metadata store +(Note: `forceMetadataRefresh=true` refreshes Coordinator's metadata cache of all datasources. This can be a heavy operation in terms +of the load on the metadata store but can be necessary to make sure that we verify all the latest segments' load status) +* Setting `forceMetadataRefresh` to false will use the metadata cached on the coordinator from the last force/periodic refresh. + +You can pass the optional query parameter `computeUsingClusterView` to factor in the available cluster services when calculating +the segments left to load. See [Coordinator Segment Loading](#segment-loading) for details. +If no used segments are found for the given inputs, this API returns `204 No Content` + +## Metadata store information + +:::info + Note: Much of this information is available in a simpler, easier-to-use form through the Druid SQL + [`sys.segments`](../querying/sql-metadata-tables.md#segments-table) table. +::: + +`GET /druid/coordinator/v1/metadata/segments` + +Returns a list of all segments for each datasource enabled in the cluster. + +`GET /druid/coordinator/v1/metadata/segments?datasources={dataSourceName1}&datasources={dataSourceName2}` + +Returns a list of all segments for one or more specific datasources enabled in the cluster. + +`GET /druid/coordinator/v1/metadata/segments?includeOvershadowedStatus` + +Returns a list of all segments for each datasource with the full segment metadata and an extra field `overshadowed`. 
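+
+For example, you can pull this list for a quick inspection of segment metadata. The following sketch assumes a quickstart deployment with the Router at `localhost:8888`:
+
+```shell
+# List all used segments, including the `overshadowed` flag for each segment.
+# Assumes a quickstart deployment with the Router at localhost:8888.
+curl -s "http://localhost:8888/druid/coordinator/v1/metadata/segments?includeOvershadowedStatus"
+```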
+
+`GET /druid/coordinator/v1/metadata/segments?includeOvershadowedStatus&includeRealtimeSegments`
+
+Returns a list of all published and realtime segments for each datasource with the full segment metadata and extra fields `overshadowed`, `realtime`, and `numRows`. Realtime segments are returned only when `druid.centralizedDatasourceSchema.enabled` is set on the Coordinator.
+
+`GET /druid/coordinator/v1/metadata/segments?includeOvershadowedStatus&datasources={dataSourceName1}&datasources={dataSourceName2}`
+
+Returns a list of all segments for one or more specific datasources with the full segment metadata and an extra field `overshadowed`.
+
+`GET /druid/coordinator/v1/metadata/segments?includeOvershadowedStatus&includeRealtimeSegments&datasources={dataSourceName1}&datasources={dataSourceName2}`
+
+Returns a list of all published and realtime segments for the specified datasources with the full segment metadata and extra fields `overshadowed`, `realtime`, and `numRows`. Realtime segments are returned only when `druid.centralizedDatasourceSchema.enabled` is set on the Coordinator.
+
+`GET /druid/coordinator/v1/metadata/datasources`
+
+Returns a list of the names of datasources with at least one used segment in the cluster, retrieved from the metadata database. Users should call this API to get the eventual state that the system will be in.
+
+`GET /druid/coordinator/v1/metadata/datasources?includeUnused`
+
+Returns a list of the names of datasources, regardless of whether there are used segments belonging to those datasources in the cluster or not.
+
+`GET /druid/coordinator/v1/metadata/datasources?includeDisabled`
+
+Returns a list of the names of datasources, regardless of whether the datasource is disabled or not.
+
+`GET /druid/coordinator/v1/metadata/datasources?full`
+
+Returns a list of all datasources with at least one used segment in the cluster. Returns all metadata about those datasources as stored in the metadata store.
+
+`GET /druid/coordinator/v1/metadata/datasources/{dataSourceName}`
+
+Returns full metadata for a datasource as stored in the metadata store.
+
+`GET /druid/coordinator/v1/metadata/datasources/{dataSourceName}/segments`
+
+Returns a list of all segments for a datasource as stored in the metadata store.
+
+`GET /druid/coordinator/v1/metadata/datasources/{dataSourceName}/segments?full`
+
+Returns a list of all segments for a datasource with the full segment metadata as stored in the metadata store.
+
+`GET /druid/coordinator/v1/metadata/datasources/{dataSourceName}/segments/{segmentId}`
+
+Returns full segment metadata for a specific segment as stored in the metadata store, if the segment is used. If the
+segment is unused, or is unknown, a 404 response is returned.
+
+`GET /druid/coordinator/v1/metadata/datasources/{dataSourceName}/segments/{segmentId}?includeUnused=true`
+
+Returns full segment metadata for a specific segment as stored in the metadata store. If it is unknown, a 404 response
+is returned.
+
+`GET /druid/coordinator/v1/metadata/datasources/{dataSourceName}/segments`
+
+Returns a list of all segments, overlapping with any of the given intervals, for a datasource as stored in the metadata store. The request body is an array of ISO 8601 interval strings like `[interval1, interval2,...]`—for example, `["2012-01-01T00:00:00.000/2012-01-03T00:00:00.000", "2012-01-05T00:00:00.000/2012-01-07T00:00:00.000"]`. 
+ +`GET /druid/coordinator/v1/metadata/datasources/{dataSourceName}/segments?full` + +Returns a list of all segments, overlapping with any of given intervals, for a datasource with the full segment metadata as stored in the metadata store. Request body is array of string ISO 8601 intervals like `[interval1, interval2,...]`—for example, `["2012-01-01T00:00:00.000/2012-01-03T00:00:00.000", "2012-01-05T00:00:00.000/2012-01-07T00:00:00.000"]`. + +`POST /druid/coordinator/v1/metadata/dataSourceInformation` + +Returns information about the specified datasources, including the datasource schema. + +`POST /druid/coordinator/v1/metadata/bootstrapSegments` + +Returns information about bootstrap segments for all datasources. The returned set includes all broadcast segments if broadcast rules are configured. + + + +## Datasources + +Note that all _interval_ URL parameters are ISO 8601 strings delimited by a `_` instead of a `/`—for example, `2016-06-27_2016-06-28`. + +`GET /druid/coordinator/v1/datasources` + +Returns a list of datasource names found in the cluster as seen by the coordinator. This view is updated every [`druid.coordinator.period`](../configuration/index.md#coordinator-operation). + +`GET /druid/coordinator/v1/datasources?simple` + +Returns a list of JSON objects containing the name and properties of datasources found in the cluster. Properties include segment count, total segment byte size, replicated total segment byte size, minTime, and maxTime. + +`GET /druid/coordinator/v1/datasources?full` + +Returns a list of datasource names found in the cluster with all metadata about those datasources. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}` + +Returns a JSON object containing the name and properties of a datasource. Properties include segment count, total segment byte size, replicated total segment byte size, minTime, and maxTime. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}?full` + +Returns full metadata for a datasource. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/intervals` + +Returns a set of segment intervals. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/intervals?simple` + +Returns a map of an interval to a JSON object containing the total byte size of segments and number of segments for that interval. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/intervals?full` + +Returns a map of an interval to a map of segment metadata to a set of server names that contain the segment for that interval. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/intervals/{interval}` + +Returns a set of segment ids for an interval. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/intervals/{interval}?simple` + +Returns a map of segment intervals contained within the specified interval to a JSON object containing the total byte size of segments and number of segments for an interval. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/intervals/{interval}?full` + +Returns a map of segment intervals contained within the specified interval to a map of segment metadata to a set of server names that contain the segment for an interval. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/intervals/{interval}/serverview` + +Returns a map of segment intervals contained within the specified interval to information about the servers that contain the segment for an interval. + +`GET /druid/coordinator/v1/datasources/{dataSourceName}/segments` + +Returns a list of all segments for a datasource in the cluster. 
+
+`GET /druid/coordinator/v1/datasources/{dataSourceName}/segments?full`
+
+Returns a list of all segments for a datasource in the cluster with the full segment metadata.
+
+`GET /druid/coordinator/v1/datasources/{dataSourceName}/segments/{segmentId}`
+
+Returns full segment metadata for a specific segment in the cluster.
+
+`GET /druid/coordinator/v1/datasources/{dataSourceName}/tiers`
+
+Returns the tiers that a datasource exists in.
+
+## Intervals
+
+Note that all _interval_ URL parameters are ISO 8601 strings delimited by a `_` instead of a `/` as in `2016-06-27_2016-06-28`.
+
+`GET /druid/coordinator/v1/intervals`
+
+Returns all intervals for all datasources with total size and count.
+
+`GET /druid/coordinator/v1/intervals/{interval}`
+
+Returns aggregated total size and count for all intervals that intersect the given ISO interval.
+
+`GET /druid/coordinator/v1/intervals/{interval}?simple`
+
+Returns total size and count for each interval within the given ISO interval.
+
+`GET /druid/coordinator/v1/intervals/{interval}?full`
+
+Returns total size and count for each datasource for each interval within the given ISO interval.
+
+## Server information
+
+`GET /druid/coordinator/v1/servers`
+
+Returns a list of server URLs using the format `{hostname}:{port}`. Note that
+processes of different types running on the same host appear multiple times with
+different ports.
+
+`GET /druid/coordinator/v1/servers?simple`
+
+Returns a list of server data objects in which each object has the following keys:
+* `host`: host URL in the form `{hostname}:{port}`
+* `type`: process type (`indexer-executor`, `historical`)
+* `currSize`: storage size currently used
+* `maxSize`: maximum storage size
+* `priority`
+* `tier`
+
+
+## Query server
+
+This section documents the API endpoints for the services that reside on Query servers (Brokers) in the suggested [three-server configuration](../design/architecture.md#druid-servers).
+
+### Broker
+
+#### Datasource information
+
+Note that all _interval_ URL parameters are ISO 8601 strings delimited by a `_` instead of a `/`
+as in `2016-06-27_2016-06-28`.
+
+:::info
+ Note: Much of this information is available in a simpler, easier-to-use form through the Druid SQL
+ [`INFORMATION_SCHEMA.TABLES`](../querying/sql-metadata-tables.md#tables-table),
+ [`INFORMATION_SCHEMA.COLUMNS`](../querying/sql-metadata-tables.md#columns-table), and
+ [`sys.segments`](../querying/sql-metadata-tables.md#segments-table) tables.
+:::
+
+`GET /druid/v2/datasources`
+
+Returns a list of queryable datasources.
+
+`GET /druid/v2/datasources/{dataSourceName}`
+
+Returns the dimensions and metrics of the datasource. Optionally, you can provide the request parameter `full` to get the list of served intervals with the dimensions and metrics being served for those intervals. You can also provide the request parameter `interval` explicitly to refer to a particular interval.
+
+If no interval is specified, a default interval spanning a configurable period before the current time is used. The default duration of this interval is specified in ISO 8601 duration format via `druid.query.segmentMetadata.defaultHistory`.
+
+`GET /druid/v2/datasources/{dataSourceName}/dimensions`
+
+:::info
+ This API is deprecated and will be removed in future releases. Please use [SegmentMetadataQuery](../querying/segmentmetadataquery.md) instead,
+ which provides more comprehensive information and supports all dataSource types including streaming dataSources. 
 If you're using SQL, consider the [INFORMATION_SCHEMA tables](../querying/sql-metadata-tables.md) as well.
+:::
+
+Returns the dimensions of the datasource.
+
+`GET /druid/v2/datasources/{dataSourceName}/metrics`
+
+:::info
+ This API is deprecated and will be removed in future releases. Please use [SegmentMetadataQuery](../querying/segmentmetadataquery.md) instead,
+ which provides more comprehensive information and supports all dataSource types including streaming dataSources. If you're using SQL, consider the [INFORMATION_SCHEMA tables](../querying/sql-metadata-tables.md) as well.
+:::
+
+Returns the metrics of the datasource.
+
+`GET /druid/v2/datasources/{dataSourceName}/candidates?intervals={comma-separated-intervals}&numCandidates={numCandidates}`
+
+Returns segment information lists including server locations for the given datasource and intervals. If `numCandidates` is not specified, the endpoint returns all servers for each interval.
diff --git a/docs/35.0.0/api-reference/lookups-api.md b/docs/35.0.0/api-reference/lookups-api.md
new file mode 100644
index 0000000000..4a122917b5
--- /dev/null
+++ b/docs/35.0.0/api-reference/lookups-api.md
@@ -0,0 +1,279 @@
+---
+id: lookups-api
+title: Lookups API
+sidebar_label: Lookups
+---
+
+
+
+This document describes the API endpoints to configure, update, retrieve, and manage lookups for Apache Druid.
+
+## Configure lookups
+
+### Bulk update
+
+Lookups can be updated in bulk by posting a JSON object to `/druid/coordinator/v1/lookups/config`. The format of the JSON object is as follows:
+
+```json
+{
+  "<tierName>": {
+    "<lookupName>": {
+      "version": "<version>",
+      "lookupExtractorFactory": {
+        "type": "<someExtractorFactoryType>",
+        "<someExtractorField>": "<someExtractorValue>"
+      }
+    }
+  }
+}
+```
+
+Note that `version` is an arbitrary string assigned by the user. When you update an existing lookup, you must specify a lexicographically higher version.
+
+For example, a config might look something like:
+
+```json
+{
+  "__default": {
+    "country_code": {
+      "version": "v0",
+      "lookupExtractorFactory": {
+        "type": "map",
+        "map": {
+          "77483": "United States"
+        }
+      }
+    },
+    "site_id": {
+      "version": "v0",
+      "lookupExtractorFactory": {
+        "type": "cachedNamespace",
+        "extractionNamespace": {
+          "type": "jdbc",
+          "connectorConfig": {
+            "createTables": true,
+            "connectURI": "jdbc:mysql:\/\/localhost:3306\/druid",
+            "user": "druid",
+            "password": "diurd"
+          },
+          "table": "lookupTable",
+          "keyColumn": "country_id",
+          "valueColumn": "country_name",
+          "tsColumn": "timeColumn"
+        },
+        "firstCacheTimeout": 120000,
+        "injective": true
+      }
+    },
+    "site_id_customer1": {
+      "version": "v0",
+      "lookupExtractorFactory": {
+        "type": "map",
+        "map": {
+          "847632": "Internal Use Only"
+        }
+      }
+    },
+    "site_id_customer2": {
+      "version": "v0",
+      "lookupExtractorFactory": {
+        "type": "map",
+        "map": {
+          "AHF77": "Home"
+        }
+      }
+    }
+  },
+  "realtime_customer1": {
+    "country_code": {
+      "version": "v0",
+      "lookupExtractorFactory": {
+        "type": "map",
+        "map": {
+          "77483": "United States"
+        }
+      }
+    },
+    "site_id_customer1": {
+      "version": "v0",
+      "lookupExtractorFactory": {
+        "type": "map",
+        "map": {
+          "847632": "Internal Use Only"
+        }
+      }
+    }
+  },
+  "realtime_customer2": {
+    "country_code": {
+      "version": "v0",
+      "lookupExtractorFactory": {
+        "type": "map",
+        "map": {
+          "77483": "United States"
+        }
+      }
+    },
+    "site_id_customer2": {
+      "version": "v0",
+      "lookupExtractorFactory": {
+        "type": "map",
+        "map": {
+          "AHF77": "Home"
+        }
+      }
+    }
+  }
+}
+```
+
+All entries in the map will UPDATE existing entries. No entries will be deleted. 
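+
+As an illustration of the bulk update format, the following sketch creates or updates a single map lookup in the `__default` tier. The quickstart Router address and the lookup contents are assumptions for the example:
+
+```shell
+# Bulk update: create or update the country_code map lookup in the __default tier.
+# Assumes a quickstart deployment with the Router at localhost:8888.
+curl "http://localhost:8888/druid/coordinator/v1/lookups/config" \
+--header 'Content-Type: application/json' \
+--data '{
+  "__default": {
+    "country_code": {
+      "version": "v1",
+      "lookupExtractorFactory": {
+        "type": "map",
+        "map": { "77483": "United States" }
+      }
+    }
+  }
+}'
+```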
+ +### Update lookup + +A `POST` to a particular lookup extractor factory via `/druid/coordinator/v1/lookups/config/{tier}/{id}` creates or updates that specific extractor factory. + +For example, a post to `/druid/coordinator/v1/lookups/config/realtime_customer1/site_id_customer1` might contain the following: + +```json +{ + "version": "v1", + "lookupExtractorFactory": { + "type": "map", + "map": { + "847632": "Internal Use Only" + } + } +} +``` + +This will replace the `site_id_customer1` lookup in the `realtime_customer1` with the definition above. + +Assign a unique version identifier each time you update a lookup extractor factory. Otherwise the call will fail. + +### Get all lookups + +A `GET` to `/druid/coordinator/v1/lookups/config/all` will return all known lookup specs for all tiers. + +### Get lookup + +A `GET` to a particular lookup extractor factory is accomplished via `/druid/coordinator/v1/lookups/config/{tier}/{id}` + +Using the prior example, a `GET` to `/druid/coordinator/v1/lookups/config/realtime_customer2/site_id_customer2` should return + +```json +{ + "version": "v1", + "lookupExtractorFactory": { + "type": "map", + "map": { + "AHF77": "Home" + } + } +} +``` + +### Delete lookup + +A `DELETE` to `/druid/coordinator/v1/lookups/config/{tier}/{id}` will remove that lookup from the cluster. If it was last lookup in the tier, then tier is deleted as well. + +### Delete tier + +A `DELETE` to `/druid/coordinator/v1/lookups/config/{tier}` will remove that tier from the cluster. + +### List tier names + +A `GET` to `/druid/coordinator/v1/lookups/config` will return a list of known tier names in the dynamic configuration. +To discover a list of tiers currently active in the cluster in addition to ones known in the dynamic configuration, the parameter `discover=true` can be added as per `/druid/coordinator/v1/lookups/config?discover=true`. + +### List lookup names + +A `GET` to `/druid/coordinator/v1/lookups/config/{tier}` will return a list of known lookup names for that tier. + +These end points can be used to get the propagation status of configured lookups to processes using lookups such as Historicals. + +## Lookup status + +### List load status of all lookups + +`GET` `/druid/coordinator/v1/lookups/status` with optional query parameter `detailed`. + +### List load status of lookups in a tier + +`GET` `/druid/coordinator/v1/lookups/status/{tier}` with optional query parameter `detailed`. + +### List load status of single lookup + +`GET` `/druid/coordinator/v1/lookups/status/{tier}/{lookup}` with optional query parameter `detailed`. + +### List lookup state of all processes + +`GET` `/druid/coordinator/v1/lookups/nodeStatus` with optional query parameter `discover` to discover tiers advertised by other Druid nodes, or by default, returning all configured lookup tiers. The default response will also include the lookups which are loaded, being loaded, or being dropped on each node, for each tier, including the complete lookup spec. Add the optional query parameter `detailed=false` to only include the 'version' of the lookup instead of the complete spec. + +### List lookup state of processes in a tier + +`GET` `/druid/coordinator/v1/lookups/nodeStatus/{tier}` + +### List lookup state of single process + +`GET` `/druid/coordinator/v1/lookups/nodeStatus/{tier}/{host:port}` + +## Internal API + +The Peon, Router, Broker, and Historical processes all have the ability to consume lookup configuration. 
+There is an internal API these processes use to list/load/drop their lookups starting at `/druid/listen/v1/lookups`. +These follow the same convention for return values as the cluster wide dynamic configuration. Following endpoints +can be used for debugging purposes but not otherwise. + +### Get lookups + +A `GET` to the process at `/druid/listen/v1/lookups` will return a json map of all the lookups currently active on the process. +The return value will be a json map of the lookups to their extractor factories. + +```json +{ + "site_id_customer2": { + "version": "v1", + "lookupExtractorFactory": { + "type": "map", + "map": { + "AHF77": "Home" + } + } + } +} +``` + +### Get lookup + +A `GET` to the process at `/druid/listen/v1/lookups/some_lookup_name` will return the LookupExtractorFactory for the lookup identified by `some_lookup_name`. +The return value will be the json representation of the factory. + +```json +{ + "version": "v1", + "lookupExtractorFactory": { + "type": "map", + "map": { + "AHF77": "Home" + } + } +} +``` \ No newline at end of file diff --git a/docs/35.0.0/api-reference/retention-rules-api.md b/docs/35.0.0/api-reference/retention-rules-api.md new file mode 100644 index 0000000000..c21e546abd --- /dev/null +++ b/docs/35.0.0/api-reference/retention-rules-api.md @@ -0,0 +1,562 @@ +--- +id: retention-rules-api +title: Retention rules API +sidebar_label: Retention rules +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + + +This topic describes the API endpoints for managing retention rules in Apache Druid. You can configure retention rules in the Druid web console or API. + +Druid uses retention rules to determine what data is retained in the cluster. Druid supports load, drop, and broadcast rules. For more information, see [Using rules to drop and retain data](../operations/rule-configuration.md). + +In this topic, `http://ROUTER_IP:ROUTER_PORT` is a placeholder for your Router service address and port. Replace it with the information for your deployment. For example, use `http://localhost:8888` for quickstart deployments. + +## Update retention rules for a datasource + +Updates one or more retention rules for a datasource. The request body takes an array of retention rule objects. For details on defining retention rules, see the following sources: + +* [Load rules](../operations/rule-configuration.md#load-rules) +* [Drop rules](../operations/rule-configuration.md#drop-rules) +* [Broadcast rules](../operations/rule-configuration.md#broadcast-rules) + +This request overwrites any existing rules for the datasource. +Druid reads rules in the order in which they appear; for more information, see [rule structure](../operations/rule-configuration.md). + +Note that this endpoint returns an HTTP `200 OK` even if the datasource does not exist. + +### URL + +`POST` `/druid/coordinator/v1/rules/{dataSource}` + +### Header parameters + +The endpoint supports a set of optional header parameters to populate the `author` and `comment` fields in the `auditInfo` property for audit history. + +* `X-Druid-Author` (optional) + * Type: String + * A string representing the author making the configuration change. +* `X-Druid-Comment` (optional) + * Type: String + * A string describing the update. + +### Responses + + + + + + +*Successfully updated retention rules for specified datasource* + + + + +--- + +### Sample request + +The following example sets a set of broadcast, load, and drop retention rules for the `kttm1` datasource. 
+ + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/rules/kttm1" \ +--header 'X-Druid-Author: doc intern' \ +--header 'X-Druid-Comment: submitted via api' \ +--header 'Content-Type: application/json' \ +--data '[ + { + "type": "broadcastForever" + }, + { + "type": "loadForever", + "tieredReplicants": { + "_default_tier": 2 + }, + "useDefaultTierForNull": true + }, + { + "type": "dropByPeriod", + "period": "P1M" + } +]' +``` + + + + + +```HTTP +POST /druid/coordinator/v1/rules/kttm1 HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +X-Druid-Author: doc intern +X-Druid-Comment: submitted via api +Content-Type: application/json +Content-Length: 273 + +[ + { + "type": "broadcastForever" + }, + { + "type": "loadForever", + "tieredReplicants": { + "_default_tier": 1 + }, + "useDefaultTierForNull": true + }, + { + "type": "dropByPeriod", + "period": "P1M" + } +] +``` + + + + +### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + +## Update default retention rules for all datasources + +Updates one or more default retention rules for all datasources. Submit retention rules as an array of objects in the request body. For details on defining retention rules, see the following sources: + +* [Load rules](../operations/rule-configuration.md#load-rules) +* [Drop rules](../operations/rule-configuration.md#drop-rules) +* [Broadcast rules](../operations/rule-configuration.md#broadcast-rules) + +This request overwrites any existing rules for all datasources. To remove default retention rules for all datasources, submit an empty rule array in the request body. Rules are read in the order in which they appear; for more information, see [rule structure](../operations/rule-configuration.md). + +### URL + +`POST` `/druid/coordinator/v1/rules/_default` + +### Header parameters + +The endpoint supports a set of optional header parameters to populate the `author` and `comment` fields in the `auditInfo` property for audit history. + +* `X-Druid-Author` (optional) + * Type: String + * A string representing the author making the configuration change. +* `X-Druid-Comment` (optional) + * Type: String + * A string describing the update. + +### Responses + + + + + + +*Successfully updated default retention rules* + + + + + +*Error with request body* + + + + +--- + +### Sample request + +The following example updates the default retention rule for all datasources with a `loadByInterval` rule. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/rules/_default" \ +--header 'Content-Type: application/json' \ +--data '[ + { + "type": "loadByInterval", + "tieredReplicants": {}, + "useDefaultTierForNull": false, + "interval": "2010-01-01/2020-01-01" + } +]' +``` + + + + + +```HTTP +POST /druid/coordinator/v1/rules/_default HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 205 + +[ + { + "type": "loadByInterval", + "tieredReplicants": {}, + "useDefaultTierForNull": false, + "interval": "2010-01-01/2020-01-01" + } +] +``` + + + + +### Sample response + +A successful request returns an HTTP `200 OK` message code and an empty response body. + +## Get an array of all retention rules + +Retrieves all current retention rules in the cluster including the default retention rule. Returns an array of objects for each datasource and their associated retention rules. 
+ +### URL + +`GET` `/druid/coordinator/v1/rules` + +### Responses + + + + + + +*Successfully retrieved retention rules* + + + + +--- + +### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/rules" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/rules HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +### Sample response + +
+ View the response
+
+ ```json
+{
+  "_default": [
+    {
+      "tieredReplicants": {
+        "_default_tier": 2
+      },
+      "type": "loadForever"
+    }
+  ],
+  "social_media": [
+    {
+      "interval": "2023-01-01T00:00:00.000Z/2023-02-01T00:00:00.000Z",
+      "type": "dropByInterval"
+    }
+  ],
+  "wikipedia_api": []
+}
+ ```
+
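+
+If you only need part of this map, you can filter the response on the client side. The following sketch is illustrative only and not part of the Druid API; it assumes the `jq` JSON processor is installed and that a `social_media` datasource exists:
+
+```shell
+# List every entry in the rules map, including the _default rules.
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/rules" | jq 'keys'
+
+# Print only the rules defined for the social_media datasource.
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/rules" | jq '."social_media"'
+```
+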
+ +## Get an array of retention rules for a datasource + +Retrieves an array of rule objects for a single datasource. Returns an empty array if there are no retention rules. + +Note that this endpoint returns an HTTP `200 OK` message code even if the datasource doesn't exist. + +### URL + +`GET` `/druid/coordinator/v1/rules/{dataSource}` + +### Query parameters + +* `full` (optional) + * Includes the default retention rule for the datasource in the response. + +### Responses + + + + + + +*Successfully retrieved retention rules* + + + + +--- + +### Sample request + +The following example retrieves the custom retention rules and default retention rules for datasource with the name `social_media`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/rules/social_media?full=null" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/rules/social_media?full=null HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +### Sample response + +
+ View the response + + ```json +[ + { + "interval": "2020-01-01T00:00:00.000Z/2022-02-01T00:00:00.000Z", + "type": "dropByInterval" + }, + { + "interval": "2010-01-01T00:00:00.000Z/2020-01-01T00:00:00.000Z", + "tieredReplicants": { + "_default_tier": 2 + }, + "type": "loadByInterval" + }, + { + "tieredReplicants": { + "_default_tier": 2 + }, + "type": "loadForever" + } +] + ``` + +
+ +## Get audit history for all datasources + +Retrieves the audit history of rules for all datasources over an interval of time. The default interval is 1 week. You can change this period by setting `druid.audit.manager.auditHistoryMillis` in the `runtime.properties` file for the Coordinator. + +### URL + +`GET` `/druid/coordinator/v1/rules/history` + +### Query parameters + +Note that the following query parameters cannot be chained. + +* `interval` (optional) + * Type: ISO 8601. + * Limits the number of results to the specified time interval. Delimit with `/`. For example, `2023-07-13/2023-07-19`. +* `count` (optional) + * Type: Int + * Limits the number of results to the last `n` entries. + +### Responses + + + + + + +*Successfully retrieved audit history* + + + + + +*Request in the incorrect format* + + + + + +*`count` query parameter too large* + + + + +--- + +### Sample request + +The following example retrieves the audit history for all datasources from `2023-07-13` to `2023-07-19`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/rules/history?interval=2023-07-13%2F2023-07-19" +``` + + + + + +```HTTP +GET /druid/coordinator/v1/rules/history?interval=2023-07-13/2023-07-19 HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +### Sample response + +
+ View the response + + ```json +[ + { + "key": "social_media", + "type": "rules", + "auditInfo": { + "author": "console", + "comment": "test", + "ip": "127.0.0.1" + }, + "payload": "[{\"interval\":\"2023-01-01T00:00:00.000Z/2023-02-01T00:00:00.000Z\",\"type\":\"dropByInterval\"}]", + "auditTime": "2023-07-13T18:05:33.066Z" + }, + { + "key": "social_media", + "type": "rules", + "auditInfo": { + "author": "console", + "comment": "test", + "ip": "127.0.0.1" + }, + "payload": "[]", + "auditTime": "2023-07-18T18:10:21.203Z" + }, + { + "key": "wikipedia_api", + "type": "rules", + "auditInfo": { + "author": "console", + "comment": "test", + "ip": "127.0.0.1" + }, + "payload": "[{\"tieredReplicants\":{\"_default_tier\":2},\"type\":\"loadForever\"}]", + "auditTime": "2023-07-18T18:10:44.519Z" + }, + { + "key": "wikipedia_api", + "type": "rules", + "auditInfo": { + "author": "console", + "comment": "test", + "ip": "127.0.0.1" + }, + "payload": "[]", + "auditTime": "2023-07-18T18:11:02.110Z" + }, + { + "key": "social_media", + "type": "rules", + "auditInfo": { + "author": "console", + "comment": "test", + "ip": "127.0.0.1" + }, + "payload": "[{\"interval\":\"2023-07-03T18:49:54.848Z/2023-07-03T18:49:55.861Z\",\"type\":\"dropByInterval\"}]", + "auditTime": "2023-07-18T18:32:50.060Z" + }, + { + "key": "social_media", + "type": "rules", + "auditInfo": { + "author": "console", + "comment": "test", + "ip": "127.0.0.1" + }, + "payload": "[{\"interval\":\"2020-01-01T00:00:00.000Z/2022-02-01T00:00:00.000Z\",\"type\":\"dropByInterval\"}]", + "auditTime": "2023-07-18T18:34:09.657Z" + }, + { + "key": "social_media", + "type": "rules", + "auditInfo": { + "author": "console", + "comment": "test", + "ip": "127.0.0.1" + }, + "payload": "[{\"interval\":\"2020-01-01T00:00:00.000Z/2022-02-01T00:00:00.000Z\",\"type\":\"dropByInterval\"},{\"tieredReplicants\":{\"_default_tier\":2},\"type\":\"loadForever\"}]", + "auditTime": "2023-07-18T18:38:37.223Z" + }, + { + "key": "social_media", + "type": "rules", + "auditInfo": { + "author": "console", + "comment": "test", + "ip": "127.0.0.1" + }, + "payload": "[{\"interval\":\"2020-01-01T00:00:00.000Z/2022-02-01T00:00:00.000Z\",\"type\":\"dropByInterval\"},{\"interval\":\"2010-01-01T00:00:00.000Z/2020-01-01T00:00:00.000Z\",\"tieredReplicants\":{\"_default_tier\":2},\"type\":\"loadByInterval\"}]", + "auditTime": "2023-07-18T18:49:43.964Z" + } +] + ``` +
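+
+Because `interval` and `count` cannot be combined, use one or the other. The following sketch retrieves only the last five audit entries instead of a time interval:
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/rules/history?count=5"
+```
+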
diff --git a/docs/35.0.0/api-reference/service-status-api.md b/docs/35.0.0/api-reference/service-status-api.md new file mode 100644 index 0000000000..47d2a5a6d3 --- /dev/null +++ b/docs/35.0.0/api-reference/service-status-api.md @@ -0,0 +1,1469 @@ +--- +id: service-status-api +title: Service status API +sidebar_label: Service status +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + + + +This document describes the API endpoints to retrieve service status, cluster information for Apache Druid. + +In this document, `http://SERVICE_IP:SERVICE_PORT` is a placeholder for the server address of deployment and the service port. For example, on the quickstart configuration, replace `http://ROUTER_IP:ROUTER_PORT` with `http://localhost:8888`. + +## Common + +All services support the following endpoints. + +You can use each endpoint with the ports for each type of service. The following table contains port addresses for a local configuration: + +|Service|Port address| +| ------ | ------------ | +| Coordinator|8081| +| Overlord|8081| +| Router|8888| +| Broker|8082| +| Historical|8083| +| Middle Manager|8091| + +### Get service information + +Retrieves the Druid version, loaded extensions, memory used, total memory, and other useful information about the individual service. + +Modify the host and port for the endpoint to match the service to query. Refer to the [default service ports](#common) for the port numbers. + +#### URL + +`GET` `/status` + +#### Responses + + + + + + +
+ +*Successfully retrieved service information* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/status" +``` + + + + + +```http +GET /status HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "version": "26.0.0", + "modules": [ + { + "name": "org.apache.druid.common.aws.AWSModule", + "artifact": "druid-aws-common", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.common.gcp.GcpModule", + "artifact": "druid-gcp-common", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.storage.hdfs.HdfsStorageDruidModule", + "artifact": "druid-hdfs-storage", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.indexing.kafka.KafkaIndexTaskModule", + "artifact": "druid-kafka-indexing-service", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.query.aggregation.datasketches.theta.SketchModule", + "artifact": "druid-datasketches", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.query.aggregation.datasketches.theta.oldapi.OldApiSketchModule", + "artifact": "druid-datasketches", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.query.aggregation.datasketches.quantiles.DoublesSketchModule", + "artifact": "druid-datasketches", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.query.aggregation.datasketches.tuple.ArrayOfDoublesSketchModule", + "artifact": "druid-datasketches", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.query.aggregation.datasketches.hll.HllSketchModule", + "artifact": "druid-datasketches", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.query.aggregation.datasketches.kll.KllSketchModule", + "artifact": "druid-datasketches", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.msq.guice.MSQExternalDataSourceModule", + "artifact": "druid-multi-stage-query", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.msq.guice.MSQIndexingModule", + "artifact": "druid-multi-stage-query", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.msq.guice.MSQDurableStorageModule", + "artifact": "druid-multi-stage-query", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.msq.guice.MSQServiceClientModule", + "artifact": "druid-multi-stage-query", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.msq.guice.MSQSqlModule", + "artifact": "druid-multi-stage-query", + "version": "26.0.0" + }, + { + "name": "org.apache.druid.msq.guice.SqlTaskModule", + "artifact": "druid-multi-stage-query", + "version": "26.0.0" + } + ], + "memory": { + "maxMemory": 268435456, + "totalMemory": 268435456, + "freeMemory": 139060688, + "usedMemory": 129374768, + "directMemory": 134217728 + } + } + ``` +
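+
+To pick out individual fields from this response, you can filter it on the client side. The following sketch assumes the `jq` JSON processor is installed and prints only the Druid version and the set of loaded extension artifacts:
+
+```shell
+curl -s "http://ROUTER_IP:ROUTER_PORT/status" | jq '{version: .version, extensions: ([.modules[].artifact] | unique)}'
+```
+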
+ +### Get service health + +Retrieves the online status of the individual Druid service. It is a simple health check to determine if the service is running and accessible. If online, it will always return a boolean `true` value, indicating that the service can receive API calls. This endpoint is suitable for automated health checks. + +Modify the host and port for the endpoint to match the service to query. Refer to the [default service ports](#common) for the port numbers. + +Additional checks for readiness should use the [Historical segment readiness](#get-segment-readiness) and [Broker query readiness](#get-broker-query-readiness) endpoints. + +#### URL + +`GET` `/status/health` + +#### Responses + + + + + + +
+ +*Successfully retrieved service health* + +
+
+ +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/status/health" +``` + + + + + +```http +GET /status/health HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + true + ``` + +
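+
+Because the endpoint returns `true` with a success status code when the service is reachable, an automated check can rely on the exit code of `curl --fail` alone. The following is a minimal sketch of such a check:
+
+```shell
+# Exits non-zero if the service is unreachable or returns an error status.
+curl --fail --silent "http://ROUTER_IP:ROUTER_PORT/status/health" > /dev/null || echo "service is not healthy" >&2
+```
+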
+ + +### Get configuration properties + +Retrieves the current configuration properties of the individual service queried. + +Modify the host and port for the endpoint to match the service to query. Refer to the [default service ports](#common) for the port numbers. + +#### URL + +`GET` `/status/properties` + +#### Responses + + + + + + +
+ +*Successfully retrieved service configuration properties* + +
+
+ +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/status/properties" +``` + + + + + +```http +GET /status/properties HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { +{ + "gopherProxySet": "false", + "awt.toolkit": "sun.lwawt.macosx.LWCToolkit", + "druid.monitoring.monitors": "[\"org.apache.druid.java.util.metrics.JvmMonitor\"]", + "java.specification.version": "11", + "sun.cpu.isalist": "", + "druid.plaintextPort": "8888", + "sun.jnu.encoding": "UTF-8", + "druid.indexing.doubleStorage": "double", + "druid.metadata.storage.connector.port": "1527", + "java.class.path": "/Users/genericUserPath", + "log4j.shutdownHookEnabled": "true", + "java.vm.vendor": "Homebrew", + "sun.arch.data.model": "64", + "druid.extensions.loadList": "[\"druid-hdfs-storage\", \"druid-kafka-indexing-service\", \"druid-datasketches\", \"druid-multi-stage-query\"]", + "java.vendor.url": "https://github.com/Homebrew/homebrew-core/issues", + "druid.router.coordinatorServiceName": "druid/coordinator", + "user.timezone": "UTC", + "druid.global.http.eagerInitialization": "false", + "os.name": "Mac OS X", + "java.vm.specification.version": "11", + "sun.java.launcher": "SUN_STANDARD", + "user.country": "US", + "sun.boot.library.path": "/opt/homebrew/Cellar/openjdk@11/11.0.19/libexec/openjdk.jdk/Contents/Home/lib", + "sun.java.command": "org.apache.druid.cli.Main server router", + "http.nonProxyHosts": "local|*.local|169.254/16|*.169.254/16", + "jdk.debug": "release", + "druid.metadata.storage.connector.host": "localhost", + "sun.cpu.endian": "little", + "druid.zk.paths.base": "/druid", + "user.home": "/Users/genericUser", + "user.language": "en", + "java.specification.vendor": "Oracle Corporation", + "java.version.date": "2023-04-18", + "java.home": "/opt/homebrew/Cellar/openjdk@11/11.0.19/libexec/openjdk.jdk/Contents/Home", + "druid.service": "druid/router", + "druid.selectors.coordinator.serviceName": "druid/coordinator", + "druid.metadata.storage.connector.connectURI": "jdbc:derby://localhost:1527/var/druid/metadata.db;create=true", + "file.separator": "/", + "druid.selectors.indexing.serviceName": "druid/overlord", + "java.vm.compressedOopsMode": "Zero based", + "druid.metadata.storage.type": "derby", + "line.separator": "\n", + "druid.log.path": "/Users/genericUserPath", + "java.vm.specification.vendor": "Oracle Corporation", + "java.specification.name": "Java Platform API Specification", + "druid.indexer.logs.directory": "var/druid/indexing-logs", + "java.awt.graphicsenv": "sun.awt.CGraphicsEnvironment", + "druid.router.defaultBrokerServiceName": "druid/broker", + "druid.storage.storageDirectory": "var/druid/segments", + "sun.management.compiler": "HotSpot 64-Bit Tiered Compilers", + "ftp.nonProxyHosts": "local|*.local|169.254/16|*.169.254/16", + "java.runtime.version": "11.0.19+0", + "user.name": "genericUser", + "druid.indexer.logs.type": "file", + "druid.host": "localhost", + "log4j2.is.webapp": "false", + "path.separator": ":", + "os.version": "12.6.5", + "druid.lookup.enableLookupSyncOnStartup": "false", + "java.runtime.name": "OpenJDK Runtime Environment", + "druid.zk.service.host": "localhost", + "file.encoding": "UTF-8", + "druid.sql.planner.useGroupingSetForExactDistinct": "true", + "druid.router.managementProxy.enabled": "true", + "java.vm.name": "OpenJDK 64-Bit Server VM", + "java.vendor.version": "Homebrew", + "druid.startup.logging.logProperties": "true", + "java.vendor.url.bug": "https://github.com/Homebrew/homebrew-core/issues", + "log4j.shutdownCallbackRegistry": "org.apache.druid.common.config.Log4jShutdown", + "java.io.tmpdir": "var/tmp", + "druid.sql.enable": "true", + "druid.emitter.logging.logLevel": "info", + "java.version": 
"11.0.19", + "user.dir": "/Users/genericUser/Downloads/apache-druid-26.0.0", + "os.arch": "aarch64", + "java.vm.specification.name": "Java Virtual Machine Specification", + "druid.node.type": "router", + "java.awt.printerjob": "sun.lwawt.macosx.CPrinterJob", + "sun.os.patch.level": "unknown", + "java.util.logging.manager": "org.apache.logging.log4j.jul.LogManager", + "java.library.path": "/Users/genericUserPath", + "java.vendor": "Homebrew", + "java.vm.info": "mixed mode", + "java.vm.version": "11.0.19+0", + "druid.emitter": "noop", + "sun.io.unicode.encoding": "UnicodeBig", + "druid.storage.type": "local", + "java.class.version": "55.0", + "socksNonProxyHosts": "local|*.local|169.254/16|*.169.254/16", + "druid.server.hiddenProperties": "[\"druid.s3.accessKey\",\"druid.s3.secretKey\",\"druid.metadata.storage.connector.password\", \"password\", \"key\", \"token\", \"pwd\"]" +} +``` + +
+ +### Get node discovery status and cluster integration confirmation + +Retrieves a JSON map of the form `{"selfDiscovered": true/false}`, indicating whether the node has received a confirmation from the central node discovery mechanism (currently ZooKeeper) of the Druid cluster that the node has been added to the cluster. + +Only consider a Druid node "healthy" or "ready" in automated deployment/container management systems when this endpoint returns `{"selfDiscovered": true}`. Nodes experiencing network issues may become isolated and are not healthy. +For nodes that use Zookeeper segment discovery, a response of `{"selfDiscovered": true}` indicates that the node's Zookeeper client has started receiving data from the Zookeeper cluster, enabling timely discovery of segments and other nodes. + +#### URL + +`GET` `/status/selfDiscovered/status` + +#### Responses + + + + + + +
+ +*Node was successfully added to the cluster* + +
+
+ +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/status/selfDiscovered/status" +``` + + + + + +```http +GET /status/selfDiscovered/status HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "selfDiscovered": true + } + ``` + +
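+
+In a startup or deployment script, you might poll this endpoint until the node reports itself as discovered before routing traffic to it. The following is a rough sketch that assumes the `jq` JSON processor is installed:
+
+```shell
+# Block until the node has been confirmed as a member of the cluster.
+until curl -s "http://ROUTER_IP:ROUTER_PORT/status/selfDiscovered/status" | jq -e '.selfDiscovered' > /dev/null; do
+  echo "waiting for self-discovery..."
+  sleep 5
+done
+```
+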
+ + +### Get node self-discovery status + +Returns an HTTP status code to indicate node discovery within the Druid cluster. This endpoint is similar to the `status/selfDiscovered/status` endpoint, but relies on HTTP status codes alone. +Use this endpoint for monitoring checks that are unable to examine the response body. For example, AWS load balancer health checks. + +#### URL + +`GET` `/status/selfDiscovered` + +#### Responses + + + + + + +
+ +*Successfully retrieved node status* + +
+ + + +
+ +*Unsuccessful node self-discovery* + +
+
+ +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/status/selfDiscovered" +``` + + + + + +```http +GET /status/selfDiscovered HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +A successful response to this endpoint results in an empty response body. + +## Coordinator + +### Get Coordinator leader address + +Retrieves the address of the current leader Coordinator of the cluster. If any request is sent to a non-leader Coordinator, the request is automatically redirected to the leader Coordinator. + +#### URL + +`GET` `/druid/coordinator/v1/leader` + +#### Responses + + + + + + +
+ +*Successfully retrieved leader Coordinator address* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/leader" +``` + + + + + +```http +GET /druid/coordinator/v1/leader HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + http://localhost:8081 + ``` + +
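+
+Because the response body is the leader's base URL, a script can capture it and address follow-up requests to the leader directly. A minimal sketch:
+
+```shell
+# Store the leader address, then check the leader's health.
+LEADER=$(curl -s "http://ROUTER_IP:ROUTER_PORT/druid/coordinator/v1/leader")
+curl "$LEADER/status/health"
+```
+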
+ +### Get Coordinator leader status + +Retrieves a JSON object with a `leader` key. Returns `true` if this server is the current leader Coordinator of the cluster. To get the individual address of the leader Coordinator node, see the [leader endpoint](#get-coordinator-leader-address). + +Use this endpoint as a load balancer status check when you only want the active leader to be considered in-service at the load balancer. + +#### URL + +`GET` `/druid/coordinator/v1/isLeader` + +#### Responses + + + + + + +
+ +*Current server is the leader* + +
+ + + +
+ +*Current server is not the leader* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://COORDINATOR_IP:COORDINATOR_PORT/druid/coordinator/v1/isLeader" +``` + + + + + +```http +GET /druid/coordinator/v1/isLeader HTTP/1.1 +Host: http://COORDINATOR_IP:COORDINATOR_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "leader": true + } + ``` + +
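+
+Since only the leader returns a success status code, a load balancer health check or shell script can rely on the HTTP status alone. A minimal sketch:
+
+```shell
+if curl --fail --silent --output /dev/null "http://COORDINATOR_IP:COORDINATOR_PORT/druid/coordinator/v1/isLeader"; then
+  echo "this Coordinator is currently the leader"
+else
+  echo "this Coordinator is not the leader"
+fi
+```
+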
+
+
+### Get Historical cloning status
+
+Retrieves the current status of Historical cloning from the Coordinator.
+
+#### URL
+
+`GET` `/druid/coordinator/v1/config/cloneStatus`
+
+#### Responses
+
+
+
+
+
+
+ +*Successfully retrieved cloning status* + +
+
+ +#### Sample request + + + + + + +```shell +curl "http://COORDINATOR_IP:COORDINATOR_PORT/druid/coordinator/v1/config/cloneStatus" +``` + + + + + +```http +GET /druid/coordinator/v1/config/cloneStatus HTTP/1.1 +Host: http://COORDINATOR_IP:COORDINATOR_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "cloneStatus": [ + { + "sourceServer": "localhost:8089", + "targetServer": "localhost:8083", + "state": "IN_PROGRESS", + "segmentLoadsRemaining": 0, + "segmentDropsRemaining": 0, + "bytesToLoad": 0 + } + ] +} +``` + +
+ +### Get Broker dynamic configuration view + +Retrieves the list of Brokers which have an up-to-date view of Coordinator dynamic configuration. + +#### URL + +`GET` `/druid/coordinator/v1/config/syncedBrokers` + +#### Responses + + + + + + +
+
+*Successfully retrieved Broker configuration view*
+
+
+ +#### Sample request + + + + + + +```shell +curl "http://COORDINATOR_IP:COORDINATOR_PORT/druid/coordinator/v1/config/syncedBrokers" +``` + + + + + +```http +GET /druid/coordinator/v1/config/syncedBrokers HTTP/1.1 +Host: http://COORDINATOR_IP:COORDINATOR_PORT +``` + + + + +#### Sample response + +
+ View the response + +```json +{ + "syncedBrokers": [ + { + "host": "localhost", + "port": 8082, + "lastSyncTimestampMillis": 1745756337472 + } + ] +} +``` + +
+ +## Overlord + +### Get Overlord leader address + +Retrieves the address of the current leader Overlord of the cluster. In a cluster of multiple Overlords, only one Overlord assumes the leading role, while the remaining Overlords remain on standby. + +#### URL + +`GET` `/druid/indexer/v1/leader` + +#### Responses + + + + + + +
+ +*Successfully retrieved leader Overlord address* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/leader" +``` + + + + + +```http +GET /druid/indexer/v1/leader HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + http://localhost:8081 + ``` + +
+ + +### Get Overlord leader status + +Retrieves a JSON object with a `leader` property. The value can be `true` or `false`, indicating if this server is the current leader Overlord of the cluster. To get the individual address of the leader Overlord node, see the [leader endpoint](#get-overlord-leader-address). + +Use this endpoint as a load balancer status check when you only want the active leader to be considered in-service at the load balancer. + +#### URL + +`GET` `/druid/indexer/v1/isLeader` + +#### Responses + + + + + + +
+ +*Current server is the leader* + +
+ + + +
+ +*Current server is not the leader* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://OVERLORD_IP:OVERLORD_PORT/druid/indexer/v1/isLeader" +``` + + + + + +```http +GET /druid/indexer/v1/isLeader HTTP/1.1 +Host: http://OVERLORD_IP:OVERLORD_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "leader": true + } + ``` + +
+ + +## Middle Manager + +### Get Middle Manager state status + +Retrieves the enabled state of the Middle Manager process. Returns JSON object keyed by the combined `druid.host` and `druid.port` with a boolean `true` or `false` state as the value. + +#### URL + +`GET` `/druid/worker/v1/enabled` + +#### Responses + + + + + + +
+ +*Successfully retrieved Middle Manager state* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT/druid/worker/v1/enabled" +``` + + + + + +```http +GET /druid/worker/v1/enabled HTTP/1.1 +Host: http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "localhost:8091": true + } + ``` + +
+ +### Get active tasks + +Retrieves a list of active tasks being run on the Middle Manager. Returns JSON list of task ID strings. Note that for normal usage, you should use the `/druid/indexer/v1/tasks` [Tasks API](./tasks-api.md) endpoint or one of the task state specific variants instead. + +#### URL + +`GET` `/druid/worker/v1/tasks` + +#### Responses + + + + + + +
+ +*Successfully retrieved active tasks* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT/druid/worker/v1/tasks" +``` + + + + + +```http +GET /druid/worker/v1/tasks HTTP/1.1 +Host: http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + [ + "index_parallel_wikipedia_mgchefio_2023-06-13T22:18:05.360Z" + ] + ``` + +
+ +### Get task log + +Retrieves task log output stream by task ID. For normal usage, you should use the `/druid/indexer/v1/task/{taskId}/log` +[Tasks API](./tasks-api.md) endpoint instead. + +#### URL + +`GET` `/druid/worker/v1/task/{taskId}/log` + +### Shut down running task + +Shuts down a running task by ID. For normal usage, you should use the `/druid/indexer/v1/task/{taskId}/shutdown` +[Tasks API](./tasks-api.md) endpoint instead. + +#### URL + +`POST` `/druid/worker/v1/task/{taskId}/shutdown` + +#### Responses + + + + + +
+ +*Successfully shut down a task* + +
+
+
+---
+
+#### Sample request
+
+The following example shuts down a task with the specified ID `index_kafka_wikiticker_f7011f8ffba384b_fpeclode`.
+
+
+
+
+
+
+```shell
+curl --request POST "http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT/druid/worker/v1/task/index_kafka_wikiticker_f7011f8ffba384b_fpeclode/shutdown"
+```
+
+
+
+
+
+```http
+POST /druid/worker/v1/task/index_kafka_wikiticker_f7011f8ffba384b_fpeclode/shutdown HTTP/1.1
+Host: http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "task":"index_kafka_wikiticker_f7011f8ffba384b_fpeclode" + } + ``` + +
+ +### Disable Middle Manager + +Disables a Middle Manager, causing it to stop accepting new tasks but complete all existing tasks. Returns a JSON object +keyed by the combined `druid.host` and `druid.port`. + +#### URL + +`POST` `/druid/worker/v1/disable` + +#### Responses + + + + + + +
+ +*Successfully disabled Middle Manager* + +
+
+
+#### Sample request
+
+
+
+
+
+
+```shell
+curl --request POST "http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT/druid/worker/v1/disable"
+```
+
+
+
+
+
+```http
+POST /druid/worker/v1/disable HTTP/1.1
+Host: http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "localhost:8091":"disabled" + } + ``` + +
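+
+A common use for this endpoint is draining a Middle Manager before maintenance: disable it, wait for its running tasks to finish, then restart or decommission it and re-enable it afterward (see the next section). The following rough sketch assumes the `jq` JSON processor is installed:
+
+```shell
+# Stop accepting new tasks on this Middle Manager.
+curl --request POST "http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT/druid/worker/v1/disable"
+
+# Wait until the list of active tasks is empty.
+until curl -s "http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT/druid/worker/v1/tasks" | jq -e 'length == 0' > /dev/null; do
+  echo "waiting for running tasks to finish..."
+  sleep 30
+done
+```
+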
+ +### Enable Middle Manager + +Enables a Middle Manager, allowing it to accept new tasks again if it was previously disabled. Returns a JSON object keyed by the combined `druid.host` and `druid.port`. + +#### URL + +`POST` `/druid/worker/v1/enable` + +#### Responses + + + + + + +
+ +*Successfully enabled Middle Manager* + +
+
+
+#### Sample request
+
+
+
+
+
+
+```shell
+curl --request POST "http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT/druid/worker/v1/enable"
+```
+
+
+
+
+
+```http
+POST /druid/worker/v1/enable HTTP/1.1
+Host: http://MIDDLEMANAGER_IP:MIDDLEMANAGER_PORT
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "localhost:8091":"enabled" + } + ``` + +
+
+## Historical
+
+### Get segment load status
+
+Retrieves a JSON object of the form `{"cacheInitialized":value}`, where value is either `true` or `false` indicating if all segments in the local cache have been loaded.
+
+Use this endpoint to know when a Historical process is ready to be queried after a restart.
+
+#### URL
+
+`GET` `/druid/historical/v1/loadstatus`
+
+#### Responses
+
+
+
+
+
+
+ +*Successfully retrieved status* + +
+
+ +#### Sample request + + + + + + +```shell +curl "http://HISTORICAL_IP:HISTORICAL_PORT/druid/historical/v1/loadstatus" +``` + + + + + +```http +GET /druid/historical/v1/loadstatus HTTP/1.1 +Host: http://HISTORICAL_IP:HISTORICAL_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "cacheInitialized": true + } + ``` + +
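+
+For example, a rolling-restart script might poll this endpoint and wait until the local segment cache is fully loaded before moving on to the next Historical. A rough sketch, assuming the `jq` JSON processor is installed:
+
+```shell
+until curl -s "http://HISTORICAL_IP:HISTORICAL_PORT/druid/historical/v1/loadstatus" | jq -e '.cacheInitialized' > /dev/null; do
+  echo "waiting for the segment cache to load..."
+  sleep 10
+done
+```
+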
+ +### Get segment readiness + +Retrieves a status code to indicate if all segments in the local cache have been loaded. Similar to `/druid/historical/v1/loadstatus`, but instead of returning JSON with a flag, it returns status codes. + +#### URL + +`GET` `/druid/historical/v1/readiness` + +#### Responses + + + + + + +
+ +*Segments in local cache successfully loaded* + +
+ + + +
+ +*Segments in local cache have not been loaded* + +
+
+ +#### Sample request + + + + + + +```shell +curl "http://HISTORICAL_IP:HISTORICAL_PORT/druid/historical/v1/readiness" +``` + + + + + +```http +GET /druid/historical/v1/readiness HTTP/1.1 +Host: http://HISTORICAL_IP:HISTORICAL_PORT +``` + + + + +#### Sample response + +A successful response to this endpoint results in an empty response body. + +## Load Status + +### Get Broker query load status + +Retrieves a flag indicating if the Broker knows about all segments in the cluster. Use this endpoint to know when a Broker service is ready to accept queries after a restart. + +#### URL + +`GET` `/druid/broker/v1/loadstatus` + +#### Responses + + + + + + +
+ +*Segments successfully loaded* + +
+
+
+#### Sample request
+
+
+
+
+
+
+```shell
+curl "http://BROKER_IP:BROKER_PORT/druid/broker/v1/loadstatus"
+```
+
+
+
+
+
+```http
+GET /druid/broker/v1/loadstatus HTTP/1.1
+Host: http://BROKER_IP:BROKER_PORT
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "inventoryInitialized": true + } + ``` + +
+ +### Get Broker query readiness + +Retrieves a status code to indicate Broker readiness. Readiness signifies the Broker knows about all segments in the cluster and is ready to accept queries after a restart. Similar to `/druid/broker/v1/loadstatus`, but instead of returning a JSON, it returns status codes. + +#### URL + +`GET` `/druid/broker/v1/readiness` + +#### Responses + + + + + + +
+ +*Segments successfully loaded* + +
+ + + +
+ +*Segments have not been loaded* + +
+
+ +#### Sample request + + + + + + +```shell +curl "http://BROKER_IP:BROKER_PORT/druid/broker/v1/readiness" +``` + + + + + +```http +GET /druid/broker/v1/readiness HTTP/1.1 +Host: http://BROKER_IP:BROKER_PORT +``` + + + + +#### Sample response + +A successful response to this endpoint results in an empty response body. diff --git a/docs/35.0.0/api-reference/sql-api.md b/docs/35.0.0/api-reference/sql-api.md new file mode 100644 index 0000000000..af60cee4c8 --- /dev/null +++ b/docs/35.0.0/api-reference/sql-api.md @@ -0,0 +1,1727 @@ +--- +id: sql-api +title: Druid SQL API +sidebar_label: Druid SQL +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + +:::info + Apache Druid supports two query languages: Druid SQL and [native queries](../querying/querying.md). + This document describes the SQL language. +::: + +In this topic, `http://ROUTER_IP:ROUTER_PORT` is a placeholder for your Router service address and port. Replace it with the information for your deployment. For example, use `http://localhost:8888` for quickstart deployments. + +## Query from Historicals + +### Submit a query + +Submits a SQL-based query in the JSON or text format request body. +Returns a JSON object with the query results and optional metadata for the results. You can also use this endpoint to query [metadata tables](../querying/sql-metadata-tables.md). + +Each query has an associated SQL query ID. You can set this ID manually using the SQL context parameter `sqlQueryId`. If not set, Druid automatically generates `sqlQueryId` and returns it in the response header for `X-Druid-SQL-Query-Id`. Note that you need the `sqlQueryId` to [cancel a query](#cancel-a-query). + +#### URL + +`POST` `/druid/v2/sql` + +#### JSON Format Request body + +To send queries in JSON format, the `Content-Type` in the HTTP request MUST be `application/json`. +If there are multiple `Content-Type` headers, the **first** one is used. + +The request body takes the following properties: + +* `query`: SQL query string. HTTP requests are permitted to include multiple `SET` statements to assign [SQL query context parameter](../querying/sql-query-context.md) values to apply to the query statement, see [SET](../querying/sql.md#set) for details. Context parameters set by `SET` statements take priority over values set in `context`. +* `resultFormat`: String that indicates the format to return query results. Select one of the following formats: + * `object`: Returns a JSON array of JSON objects with the HTTP response header `Content-Type: application/json`. + Object field names match the columns returned by the SQL query in the same order as the SQL query. + + * `array`: Returns a JSON array of JSON arrays with the HTTP response header `Content-Type: application/json`. + Each inner array has elements matching the columns returned by the SQL query, in order. + + * `objectLines`: Returns newline-delimited JSON objects with the HTTP response header `Content-Type: text/plain`. + Newline separation facilitates parsing the entire response set as a stream if you don't have a streaming JSON parser. + This format includes a single trailing newline character so you can detect a truncated response. + + * `arrayLines`: Returns newline-delimited JSON arrays with the HTTP response header `Content-Type: text/plain`. + Newline separation facilitates parsing the entire response set as a stream if you don't have a streaming JSON parser. + This format includes a single trailing newline character so you can detect a truncated response. 
+ + * `csv`: Returns comma-separated values with one row per line. Sent with the HTTP response header `Content-Type: text/csv`. + Druid uses double quotes to escape individual field values. For example, a value with a comma returns `"A,B"`. + If the field value contains a double quote character, Druid escapes it with a second double quote character. + For example, `foo"bar` becomes `foo""bar`. + This format includes a single trailing newline character so you can detect a truncated response. + +* `header`: Boolean value that determines whether to return information on column names. When set to `true`, Druid returns the column names as the first row of the results. To also get information on the column types, set `typesHeader` or `sqlTypesHeader` to `true`. For a comparative overview of data formats and configurations for the header, see the [Query output format](#query-output-format) table. + +* `typesHeader`: Adds Druid runtime type information in the header. Requires `header` to be set to `true`. Complex types, like sketches, will be reported as `COMPLEX` if a particular complex type name is known for that field, or as `COMPLEX` if the particular type name is unknown or mixed. + +* `sqlTypesHeader`: Adds SQL type information in the header. Requires `header` to be set to `true`. + + For compatibility, Druid returns the HTTP header `X-Druid-SQL-Header-Included: yes` when all of the following conditions are met: + * The `header` property is set to true. + * The version of Druid supports `typesHeader` and `sqlTypesHeader`, regardless of whether either property is set. + +* `context`: JSON object containing optional [SQL query context parameters](../querying/sql-query-context.md), such as to set the query ID, time zone, and whether to use an approximation algorithm for distinct count. You can also set the context through the SQL SET command. For more information, see [Druid SQL overview](../querying/sql.md#set). + +* `parameters`: List of query parameters for parameterized queries. Each parameter in the array should be a JSON object containing the parameter's SQL data type and parameter value. For more information on using dynamic parameters, see [Dynamic parameters](../querying/sql.md#dynamic-parameters). For a list of supported SQL types, see [Data types](../querying/sql-data-types.md). + + For example: + + ```json + { + "query": "SELECT \"arrayDouble\", \"stringColumn\" FROM \"array_example\" WHERE ARRAY_CONTAINS(\"arrayDouble\", ?) AND \"stringColumn\" = ?", + "parameters": [ + {"type": "ARRAY", "value": [999.0, null, 5.5]}, + {"type": "VARCHAR", "value": "bar"} + ] + } + ``` + +##### Text Format Request body + +Druid also allows you to submit SQL queries in text format which is simpler than above JSON format. +To do this, just set the `Content-Type` request header to `text/plain` or `application/x-www-form-urlencoded`, and pass SQL via the HTTP Body. + +If `application/x-www-form-urlencoded` is used, make sure the SQL query is URL-encoded. + +If there are multiple `Content-Type` headers, the **first** one is used. + +For response, the `resultFormat` is always `object` with the HTTP response header `Content-Type: application/json`. +If you want more control over the query context or response format, use the above JSON format request body instead. 
+ +The following example demonstrates how to submit a SQL query in text format: + +```commandline +echo 'SELECT 1' | curl -H 'Content-Type: text/plain' http://ROUTER_IP:ROUTER_PORT/druid/v2/sql --data @- +``` + +We can also use `application/x-www-form-urlencoded` to submit URL-encoded SQL queries as shown by the following examples: + +```commandline +echo 'SELECT%20%31' | curl http://ROUTER_IP:ROUTER_PORT/druid/v2/sql --data @- +echo 'SELECT 1' | curl http://ROUTER_IP:ROUTER_PORT/druid/v2/sql --data-urlencode @- +``` + +The `curl` tool uses `application/x-www-form-urlencoded` as Content-Type header if the header is not given. + +The first example pass the URL-encoded query `SELECT%20%31`, which is `SELECT 1`, to the `curl` and `curl` will directly sends it to the server. +While the second example passes the raw query `SELECT 1` to `curl` and the `curl` encodes the query to `SELECT%20%31` because of `--data-urlencode` option and sends the encoded text to the server. + +#### Responses + + + + + + +*Successfully submitted query* + + + + + +*Error thrown due to bad query. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "A well-defined error code.", + "errorMessage": "A message with additional details about the error.", + "errorClass": "Class of exception that caused this error.", + "host": "The host on which the error occurred." +} +``` + + + + +*Request not sent due to unexpected conditions. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "A well-defined error code.", + "errorMessage": "A message with additional details about the error.", + "errorClass": "Class of exception that caused this error.", + "host": "The host on which the error occurred." +} +``` + + + + +#### Client-side error handling and truncated responses + +Druid reports errors that occur before the response body is sent as JSON with an HTTP 500 status code. The errors are reported using the same format as [native Druid query errors](../querying/querying.md#query-errors). +If an error occurs while Druid is sending the response body, the server handling the request stops the response midstream and logs an error. + +This means that when you call the SQL API, you must properly handle response truncation. +For `object` and `array` formats, truncated responses are invalid JSON. +For line-oriented formats, Druid includes a newline character as the final character of every complete response. Absence of a final newline character indicates a truncated response. + +If you detect a truncated response, treat it as an error. + +--- + +#### Sample request + +In the following example, this query demonstrates the following actions: +- Retrieves all rows from the `wikipedia` datasource. +- Filters the results where the `user` value is `BlueMoon2662`. +- Applies the `sqlTimeZone` context parameter to set the time zone of results to `America/Los_Angeles`. +- Returns descriptors for `header`, `typesHeader`, and `sqlTypesHeader`. 
+ + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql" \ +--header 'Content-Type: application/json' \ +--data '{ + "query": "SELECT * FROM wikipedia WHERE user='\''BlueMoon2662'\''", + "context" : {"sqlTimeZone" : "America/Los_Angeles"}, + "header" : true, + "typesHeader" : true, + "sqlTypesHeader" : true +}' +``` + + + + + +```HTTP +POST /druid/v2/sql HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 201 + +{ + "query": "SELECT * FROM wikipedia WHERE user='BlueMoon2662'", + "context" : {"sqlTimeZone" : "America/Los_Angeles"}, + "header" : true, + "typesHeader" : true, + "sqlTypesHeader" : true +} +``` + + + + +You can also specify query-level context parameters directly within the SQL query string using the `SET` command. For more details, see [SET](../querying/sql.md#set). + +The following request body is functionally equivalent to the previous example and uses SET instead of the `context` parameter: + +```JSON +{ + "query": "SET sqlTimeZone='America/Los_Angeles'; SELECT * FROM wikipedia WHERE user='BlueMoon2662'", + "header": true, + "typesHeader": true, + "sqlTypesHeader": true +} +``` + + +#### Sample response + +
+ View the response + +```json +[ + { + "__time": { + "type": "LONG", + "sqlType": "TIMESTAMP" + }, + "channel": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "cityName": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "comment": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "countryIsoCode": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "countryName": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "isAnonymous": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "isMinor": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "isNew": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "isRobot": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "isUnpatrolled": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "metroCode": { + "type": "LONG", + "sqlType": "BIGINT" + }, + "namespace": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "page": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "regionIsoCode": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "regionName": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "user": { + "type": "STRING", + "sqlType": "VARCHAR" + }, + "delta": { + "type": "LONG", + "sqlType": "BIGINT" + }, + "added": { + "type": "LONG", + "sqlType": "BIGINT" + }, + "deleted": { + "type": "LONG", + "sqlType": "BIGINT" + } + }, + { + "__time": "2015-09-11T17:47:53.259-07:00", + "channel": "#ja.wikipedia", + "cityName": null, + "comment": "/* 対戦通算成績と得失点 */", + "countryIsoCode": null, + "countryName": null, + "isAnonymous": "false", + "isMinor": "true", + "isNew": "false", + "isRobot": "false", + "isUnpatrolled": "false", + "metroCode": null, + "namespace": "Main", + "page": "アルビレックス新潟の年度別成績一覧", + "regionIsoCode": null, + "regionName": null, + "user": "BlueMoon2662", + "delta": 14, + "added": 14, + "deleted": 0 + } +] +``` +
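+
+For line-oriented result formats, remember to check for the trailing newline that marks a complete response, as described in the client-side error handling notes above. The following sketch writes an `arrayLines` result to a file and treats a missing final newline as truncation; the query and file name are illustrative only:
+
+```shell
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql" \
+--header 'Content-Type: application/json' \
+--data '{"query": "SELECT channel, COUNT(*) AS edits FROM wikipedia GROUP BY channel", "resultFormat": "arrayLines"}' \
+--output results.jsonl
+
+# A complete response ends with a newline; command substitution strips it, leaving an empty string.
+if [ -z "$(tail -c 1 results.jsonl)" ]; then
+  echo "response complete"
+else
+  echo "response truncated; treat it as an error" >&2
+fi
+```
+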
+ +### Cancel a query + +Cancels a query on the Router or the Broker with the associated `sqlQueryId`. The `sqlQueryId` can be manually set when the query is submitted in the query context parameter, or if not set, Druid will generate one and return it in the response header when the query is successfully submitted. Note that Druid does not enforce a unique `sqlQueryId` in the query context. If you've set the same `sqlQueryId` for multiple queries, Druid cancels all requests with that query ID. + +When you cancel a query, Druid handles the cancellation in a best-effort manner. Druid immediately marks the query as canceled and aborts the query execution as soon as possible. However, the query may continue running for a short time after you make the cancellation request. + +Cancellation requests require READ permission on all resources used in the SQL query. + +#### URL + +`DELETE` `/druid/v2/sql/{sqlQueryId}` + +#### Responses + + + + + + +*Successfully deleted query* + + + + + +*Authorization failure* + + + + + +*Invalid `sqlQueryId` or query was completed before cancellation request* + + + + +--- + +#### Sample request + +The following example cancels a request with the set query ID `request01`. + + + + + + +```shell +curl --request DELETE "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/request01" +``` + + + + + +```HTTP +DELETE /druid/v2/sql/request01 HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +A successful response results in an `HTTP 202` message code and an empty response body. + +### Query output format + +The following table shows examples of how Druid returns the column names and data types based on the result format and the type request. +In all cases, `header` is true. +The examples includes the first row of results, where the value of `user` is `BlueMoon2662`. + +``` +| Format | typesHeader | sqlTypesHeader | Example output | +|--------|-------------|----------------|--------------------------------------------------------------------------------------------| +| object | true | false | [ { "user" : { "type" : "STRING" } }, { "user" : "BlueMoon2662" } ] | +| object | true | true | [ { "user" : { "type" : "STRING", "sqlType" : "VARCHAR" } }, { "user" : "BlueMoon2662" } ] | +| object | false | true | [ { "user" : { "sqlType" : "VARCHAR" } }, { "user" : "BlueMoon2662" } ] | +| object | false | false | [ { "user" : null }, { "user" : "BlueMoon2662" } ] | +| array | true | false | [ [ "user" ], [ "STRING" ], [ "BlueMoon2662" ] ] | +| array | true | true | [ [ "user" ], [ "STRING" ], [ "VARCHAR" ], [ "BlueMoon2662" ] ] | +| array | false | true | [ [ "user" ], [ "VARCHAR" ], [ "BlueMoon2662" ] ] | +| array | false | false | [ [ "user" ], [ "BlueMoon2662" ] ] | +| csv | true | false | user STRING BlueMoon2662 | +| csv | true | true | user STRING VARCHAR BlueMoon2662 | +| csv | false | true | user VARCHAR BlueMoon2662 | +| csv | false | false | user BlueMoon2662 | +``` + +## Query from deep storage + +You can use the `sql/statements` endpoint to query segments that exist only in deep storage and are not loaded onto your Historical processes as determined by your load rules. + +Note that at least one segment of a datasource must be available on a Historical process so that the Broker can plan your query. A quick way to check if this is true is whether or not a datasource is visible in the Druid console. + + +For more information, see [Query from deep storage](../querying/query-from-deep-storage.md). 
+ +### Submit a query + +Submit a query for data stored in deep storage. Any data ingested into Druid is placed into deep storage. The query is contained in the "query" field in the JSON object within the request payload. + +Note that at least part of a datasource must be available on a Historical process so that Druid can plan your query and only the user who submits a query can see the results. + +#### URL + +`POST` `/druid/v2/sql/statements` + +#### Request body + +Generally, the `sql` and `sql/statements` endpoints support the same response body fields with minor differences. For general information about the available fields, see [Submit a query to the `sql` endpoint](#submit-a-query). + +Keep the following in mind when submitting queries to the `sql/statements` endpoint: + +- Apart from the context parameters mentioned [here](../multi-stage-query/reference.md#context-parameters) there are additional context parameters for `sql/statements` specifically: + + - `executionMode` determines how query results are fetched. Druid currently only supports `ASYNC`. You must manually retrieve your results after the query completes. + - `selectDestination` determines where final results get written. By default, results are written to task reports. Set this parameter to `durableStorage` to instruct Druid to write the results from SELECT queries to durable storage, which allows you to fetch larger result sets. For result sets with more than 3000 rows, it is highly recommended to use `durableStorage`. Note that this requires you to have [durable storage for MSQ](../operations/durable-storage.md) enabled. + +#### Responses + + + + + + +*Successfully queried from deep storage* + + + + + +*Error thrown due to bad query. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "Summary of the encountered error.", + "errorClass": "Class of exception that caused this error.", + "host": "The host on which the error occurred.", + "errorCode": "Well-defined error code.", + "persona": "Role or persona associated with the error.", + "category": "Classification of the error.", + "errorMessage": "Summary of the encountered issue with expanded information.", + "context": "Additional context about the error." +} +``` + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/statements" \ +--header 'Content-Type: application/json' \ +--data '{ + "query": "SELECT * FROM wikipedia WHERE user='\''BlueMoon2662'\''", + "context": { + "executionMode":"ASYNC" + } +}' +``` + + + + + +```HTTP +POST /druid/v2/sql/statements HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 134 + +{ + "query": "SELECT * FROM wikipedia WHERE user='BlueMoon2662'", + "context": { + "executionMode":"ASYNC" + } +} +``` + + + + +#### Sample response + +
+ View the response + + ```json +{ + "queryId": "query-b82a7049-b94f-41f2-a230-7fef94768745", + "state": "ACCEPTED", + "createdAt": "2023-07-26T21:16:25.324Z", + "schema": [ + { + "name": "__time", + "type": "TIMESTAMP", + "nativeType": "LONG" + }, + { + "name": "channel", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "cityName", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "comment", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "countryIsoCode", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "countryName", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "isAnonymous", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "isMinor", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "isNew", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "isRobot", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "isUnpatrolled", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "metroCode", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "namespace", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "page", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "regionIsoCode", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "regionName", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "user", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "delta", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "added", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "deleted", + "type": "BIGINT", + "nativeType": "LONG" + } + ], + "durationMs": -1 +} + ``` +
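+
+Because `executionMode` is `ASYNC`, the submit call only returns a query ID that you then use to check on the query and retrieve its results. The following rough sketch (assuming the `jq` JSON processor is installed) captures the ID for use with the status endpoint described in the next section:
+
+```shell
+QUERY_ID=$(curl -s "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/statements" \
+--header 'Content-Type: application/json' \
+--data '{"query": "SELECT * FROM wikipedia WHERE user='\''BlueMoon2662'\''", "context": {"executionMode": "ASYNC"}}' \
+| jq -r '.queryId')
+
+# Check on the query later using the status endpoint.
+curl "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/statements/$QUERY_ID"
+```
+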
+ +### Get query status + +Retrieves information about the query associated with the given query ID. The response matches the response from the POST API if the query is accepted or running and the execution mode is `ASYNC`. In addition to the fields that this endpoint shares with `POST /sql/statements`, a completed query's status includes the following: + +- A `result` object that summarizes information about your results, such as the total number of rows and sample records. +- A `pages` object that includes the following information for each page of results: + - `numRows`: the number of rows in that page of results. + - `sizeInBytes`: the size of the page. + - `id`: the page number that you can use to reference a specific page when you get query results. + +If the optional query parameter `detail` is supplied, then the response also includes the following: +- A `stages` object that summarizes information about the different stages being used for query execution, such as stage number, phase, start time, duration, input and output information, processing methods, and partitioning. +- A `counters` object that provides details on the rows, bytes, and files processed at various stages for each worker across different channels, along with sort progress. +- A `warnings` object that provides details about any warnings. + +#### URL + +`GET` `/druid/v2/sql/statements/{queryId}` + +#### Query parameters +* `detail` (optional) + * Type: Boolean + * Default: false + * Fetch additional details about the query, which includes the information about different stages, counters for each stage, and any warnings. + +#### Responses + + + + + + +*Successfully retrieved query status* + + + + + +*Error thrown due to bad query. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "Summary of the encountered error.", + "errorCode": "Well-defined error code.", + "persona": "Role or persona associated with the error.", + "category": "Classification of the error.", + "errorMessage": "Summary of the encountered issue with expanded information.", + "context": "Additional context about the error." +} +``` + + + + +#### Sample request + +The following example retrieves the status of a query with specified ID `query-9b93f6f7-ab0e-48f5-986a-3520f84f0804`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/statements/query-9b93f6f7-ab0e-48f5-986a-3520f84f0804?detail=true" +``` + + + + + +```HTTP +GET /druid/v2/sql/statements/query-9b93f6f7-ab0e-48f5-986a-3520f84f0804?detail=true HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json +{ + "queryId": "query-9b93f6f7-ab0e-48f5-986a-3520f84f0804", + "state": "SUCCESS", + "createdAt": "2023-07-26T22:57:46.620Z", + "schema": [ + { + "name": "__time", + "type": "TIMESTAMP", + "nativeType": "LONG" + }, + { + "name": "channel", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "cityName", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "comment", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "countryIsoCode", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "countryName", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "isAnonymous", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "isMinor", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "isNew", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "isRobot", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "isUnpatrolled", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "metroCode", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "namespace", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "page", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "regionIsoCode", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "regionName", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "user", + "type": "VARCHAR", + "nativeType": "STRING" + }, + { + "name": "delta", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "added", + "type": "BIGINT", + "nativeType": "LONG" + }, + { + "name": "deleted", + "type": "BIGINT", + "nativeType": "LONG" + } + ], + "durationMs": 25591, + "result": { + "numTotalRows": 1, + "totalSizeInBytes": 375, + "dataSource": "__query_select", + "sampleRecords": [ + [ + 1442018873259, + "#ja.wikipedia", + "", + "/* 対戦通算成績と得失点 */", + "", + "", + 0, + 1, + 0, + 0, + 0, + 0, + "Main", + "アルビレックス新潟の年度別成績一覧", + "", + "", + "BlueMoon2662", + 14, + 14, + 0 + ] + ], + "pages": [ + { + "id": 0, + "numRows": 1, + "sizeInBytes": 375 + } + ] + }, + "stages": [ + { + "stageNumber": 0, + "definition": { + "id": "query-9b93f6f7-ab0e-48f5-986a-3520f84f0804_0", + "input": [ + { + "type": "table", + "dataSource": "wikipedia", + "intervals": [ + "-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z" + ], + "filter": { + "type": "equals", + "column": "user", + "matchValueType": "STRING", + "matchValue": "BlueMoon2662" + }, + "filterFields": [ + "user" + ] + } + ], + "processor": { + "type": "scan", + "query": { + "queryType": "scan", + "dataSource": { + "type": "inputNumber", + "inputNumber": 0 + }, + "intervals": { + "type": "intervals", + "intervals": [ + "-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z" + ] + }, + "virtualColumns": [ + { + "type": "expression", + "name": "v0", + "expression": "'BlueMoon2662'", + "outputType": "STRING" + } + ], + "resultFormat": "compactedList", + "limit": 1001, + "filter": { + "type": "equals", + "column": "user", + "matchValueType": "STRING", + "matchValue": "BlueMoon2662" + }, + "columns": [ + "__time", + "added", + "channel", + "cityName", + "comment", + "commentLength", + "countryIsoCode", + "countryName", + "deleted", + "delta", + "deltaBucket", + "diffUrl", + "flags", + "isAnonymous", + "isMinor", + "isNew", + "isRobot", + "isUnpatrolled", + "metroCode", + "namespace", + "page", + "regionIsoCode", + "regionName", + "v0" + ], + "context": { + "__resultFormat": "array", + "__user": "allowAll", + "executionMode": 
"async", + "finalize": true, + "maxNumTasks": 2, + "maxParseExceptions": 0, + "queryId": "33b53acb-7533-4880-a81b-51c16c489eab", + "scanSignature": "[{\"name\":\"__time\",\"type\":\"LONG\"},{\"name\":\"added\",\"type\":\"LONG\"},{\"name\":\"channel\",\"type\":\"STRING\"},{\"name\":\"cityName\",\"type\":\"STRING\"},{\"name\":\"comment\",\"type\":\"STRING\"},{\"name\":\"commentLength\",\"type\":\"LONG\"},{\"name\":\"countryIsoCode\",\"type\":\"STRING\"},{\"name\":\"countryName\",\"type\":\"STRING\"},{\"name\":\"deleted\",\"type\":\"LONG\"},{\"name\":\"delta\",\"type\":\"LONG\"},{\"name\":\"deltaBucket\",\"type\":\"LONG\"},{\"name\":\"diffUrl\",\"type\":\"STRING\"},{\"name\":\"flags\",\"type\":\"STRING\"},{\"name\":\"isAnonymous\",\"type\":\"STRING\"},{\"name\":\"isMinor\",\"type\":\"STRING\"},{\"name\":\"isNew\",\"type\":\"STRING\"},{\"name\":\"isRobot\",\"type\":\"STRING\"},{\"name\":\"isUnpatrolled\",\"type\":\"STRING\"},{\"name\":\"metroCode\",\"type\":\"STRING\"},{\"name\":\"namespace\",\"type\":\"STRING\"},{\"name\":\"page\",\"type\":\"STRING\"},{\"name\":\"regionIsoCode\",\"type\":\"STRING\"},{\"name\":\"regionName\",\"type\":\"STRING\"},{\"name\":\"v0\",\"type\":\"STRING\"}]", + "sqlOuterLimit": 1001, + "sqlQueryId": "33b53acb-7533-4880-a81b-51c16c489eab", + "sqlStringifyArrays": false + }, + "columnTypes": [ + "LONG", + "LONG", + "STRING", + "STRING", + "STRING", + "LONG", + "STRING", + "STRING", + "LONG", + "LONG", + "LONG", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING", + "STRING" + ], + "granularity": { + "type": "all" + }, + "legacy": false + } + }, + "signature": [ + { + "name": "__boost", + "type": "LONG" + }, + { + "name": "__time", + "type": "LONG" + }, + { + "name": "added", + "type": "LONG" + }, + { + "name": "channel", + "type": "STRING" + }, + { + "name": "cityName", + "type": "STRING" + }, + { + "name": "comment", + "type": "STRING" + }, + { + "name": "commentLength", + "type": "LONG" + }, + { + "name": "countryIsoCode", + "type": "STRING" + }, + { + "name": "countryName", + "type": "STRING" + }, + { + "name": "deleted", + "type": "LONG" + }, + { + "name": "delta", + "type": "LONG" + }, + { + "name": "deltaBucket", + "type": "LONG" + }, + { + "name": "diffUrl", + "type": "STRING" + }, + { + "name": "flags", + "type": "STRING" + }, + { + "name": "isAnonymous", + "type": "STRING" + }, + { + "name": "isMinor", + "type": "STRING" + }, + { + "name": "isNew", + "type": "STRING" + }, + { + "name": "isRobot", + "type": "STRING" + }, + { + "name": "isUnpatrolled", + "type": "STRING" + }, + { + "name": "metroCode", + "type": "STRING" + }, + { + "name": "namespace", + "type": "STRING" + }, + { + "name": "page", + "type": "STRING" + }, + { + "name": "regionIsoCode", + "type": "STRING" + }, + { + "name": "regionName", + "type": "STRING" + }, + { + "name": "v0", + "type": "STRING" + } + ], + "shuffleSpec": { + "type": "mix" + }, + "maxWorkerCount": 1 + }, + "phase": "FINISHED", + "workerCount": 1, + "partitionCount": 1, + "shuffle": "mix", + "output": "localStorage", + "startTime": "2024-07-31T15:20:21.255Z", + "duration": 103 + }, + { + "stageNumber": 1, + "definition": { + "id": "query-9b93f6f7-ab0e-48f5-986a-3520f84f0804_1", + "input": [ + { + "type": "stage", + "stage": 0 + } + ], + "processor": { + "type": "limit", + "limit": 1001 + }, + "signature": [ + { + "name": "__boost", + "type": "LONG" + }, + { + "name": "__time", + "type": "LONG" + }, + { + "name": "added", + "type": "LONG" + 
}, + { + "name": "channel", + "type": "STRING" + }, + { + "name": "cityName", + "type": "STRING" + }, + { + "name": "comment", + "type": "STRING" + }, + { + "name": "commentLength", + "type": "LONG" + }, + { + "name": "countryIsoCode", + "type": "STRING" + }, + { + "name": "countryName", + "type": "STRING" + }, + { + "name": "deleted", + "type": "LONG" + }, + { + "name": "delta", + "type": "LONG" + }, + { + "name": "deltaBucket", + "type": "LONG" + }, + { + "name": "diffUrl", + "type": "STRING" + }, + { + "name": "flags", + "type": "STRING" + }, + { + "name": "isAnonymous", + "type": "STRING" + }, + { + "name": "isMinor", + "type": "STRING" + }, + { + "name": "isNew", + "type": "STRING" + }, + { + "name": "isRobot", + "type": "STRING" + }, + { + "name": "isUnpatrolled", + "type": "STRING" + }, + { + "name": "metroCode", + "type": "STRING" + }, + { + "name": "namespace", + "type": "STRING" + }, + { + "name": "page", + "type": "STRING" + }, + { + "name": "regionIsoCode", + "type": "STRING" + }, + { + "name": "regionName", + "type": "STRING" + }, + { + "name": "v0", + "type": "STRING" + } + ], + "shuffleSpec": { + "type": "maxCount", + "clusterBy": { + "columns": [ + { + "columnName": "__boost", + "order": "ASCENDING" + } + ] + }, + "partitions": 1 + }, + "maxWorkerCount": 1 + }, + "phase": "FINISHED", + "workerCount": 1, + "partitionCount": 1, + "shuffle": "globalSort", + "output": "localStorage", + "startTime": "2024-07-31T15:20:21.355Z", + "duration": 10, + "sort": true + } + ], + "counters": { + "0": { + "0": { + "input0": { + "type": "channel", + "rows": [ + 24433 + ], + "bytes": [ + 7393933 + ], + "files": [ + 22 + ], + "totalFiles": [ + 22 + ] + } + } + }, + "1": { + "0": { + "sortProgress": { + "type": "sortProgress", + "totalMergingLevels": -1, + "levelToTotalBatches": {}, + "levelToMergedBatches": {}, + "totalMergersForUltimateLevel": -1, + "triviallyComplete": true, + "progressDigest": 1 + } + } + } + }, + "warnings": [] +} + ``` +
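+
+The status payload above contains what a client needs to track a query programmatically. The following is a minimal Python sketch, assuming a quickstart Router at `http://localhost:8888` and the query ID from the sample response; it prints the overall state and a per-stage progress summary using the `state`, `durationMs`, and `stages` fields shown above. Error handling is omitted for brevity.
+
+```python
+import requests
+
+# Hypothetical values: substitute your Router address and query ID.
+ROUTER = "http://localhost:8888"
+QUERY_ID = "query-9b93f6f7-ab0e-48f5-986a-3520f84f0804"
+
+# Fetch the status payload and print a per-stage progress summary.
+response = requests.get(f"{ROUTER}/druid/v2/sql/statements/{QUERY_ID}")
+response.raise_for_status()
+status = response.json()
+
+print(f"{status['queryId']}: {status['state']} ({status.get('durationMs', -1)} ms)")
+for stage in status.get("stages", []):
+    print(
+        f"  stage {stage['stageNumber']}: {stage.get('phase', 'NEW')}, "
+        f"workers={stage.get('workerCount', 0)}, duration={stage.get('duration', 0)} ms"
+    )
+```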
+
+
+### Get query results
+
+Retrieves results for completed queries. Results are separated into pages, so you can use the optional `page` parameter to refine the results you get. Druid returns information about the composition of each page and its page number (`id`). For information about pages, see [Get query status](#get-query-status).
+
+If a page number isn't passed, all results are returned sequentially in the same response. If you have large result sets, you may encounter timeouts based on the value configured for `druid.router.http.readTimeout`.
+
+Getting the query results for an ingestion query returns an empty response.
+
+#### URL
+
+`GET` `/druid/v2/sql/statements/{queryId}/results`
+
+#### Query parameters
+* `page` (optional)
+  * Type: Int
+  * Fetch results based on page numbers. If not specified, all results are returned sequentially starting from page 0 to N in the same response.
+* `resultFormat` (optional)
+  * Type: String
+  * Defines the format in which the results are presented. The following options are supported: `arrayLines`, `objectLines`, `array`, `object`, and `csv`. The default is `object`.
+* `filename` (optional)
+  * Type: String
+  * If set, attaches a `Content-Disposition` header to the response with the value of `attachment; filename={filename}`. The filename must not be longer than 255 characters and must not contain the characters `/`, `\`, `:`, `*`, `?`, `"`, `<`, `>`, `|`, `\0`, `\n`, or `\r`.
+
+#### Responses
+
+
+*Successfully retrieved query results*
+
+
+*Query in progress. Returns a JSON object detailing the error with the following format:*
+
+```json
+{
+  "error": "Summary of the encountered error.",
+  "errorCode": "Well-defined error code.",
+  "persona": "Role or persona associated with the error.",
+  "category": "Classification of the error.",
+  "errorMessage": "Summary of the encountered issue with expanded information.",
+  "context": "Additional context about the error."
+}
+```
+
+
+*Query not found, failed, or canceled*
+
+
+*Error thrown due to bad query. Returns a JSON object detailing the error with the following format:*
+
+```json
+{
+  "error": "Summary of the encountered error.",
+  "errorCode": "Well-defined error code.",
+  "persona": "Role or persona associated with the error.",
+  "category": "Classification of the error.",
+  "errorMessage": "Summary of the encountered issue with expanded information.",
+  "context": "Additional context about the error."
+}
+```
+
+---
+
+#### Sample request
+
+The following example retrieves the results of a query with the ID `query-f3bca219-173d-44d4-bdc7-5002e910352f`.
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/statements/query-f3bca219-173d-44d4-bdc7-5002e910352f/results"
+```
+
+
+```HTTP
+GET /druid/v2/sql/statements/query-f3bca219-173d-44d4-bdc7-5002e910352f/results HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+#### Sample response
+
+ View the response + + ```json +[ + { + "__time": 1442018818771, + "channel": "#en.wikipedia", + "cityName": "", + "comment": "added project", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 0, + "isNew": 0, + "isRobot": 0, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "Talk", + "page": "Talk:Oswald Tilghman", + "regionIsoCode": "", + "regionName": "", + "user": "GELongstreet", + "delta": 36, + "added": 36, + "deleted": 0 + }, + { + "__time": 1442018820496, + "channel": "#ca.wikipedia", + "cityName": "", + "comment": "Robot inserta {{Commonscat}} que enllaça amb [[commons:category:Rallicula]]", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 1, + "isNew": 0, + "isRobot": 1, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "Main", + "page": "Rallicula", + "regionIsoCode": "", + "regionName": "", + "user": "PereBot", + "delta": 17, + "added": 17, + "deleted": 0 + }, + { + "__time": 1442018825474, + "channel": "#en.wikipedia", + "cityName": "Auburn", + "comment": "/* Status of peremptory norms under international law */ fixed spelling of 'Wimbledon'", + "countryIsoCode": "AU", + "countryName": "Australia", + "isAnonymous": 1, + "isMinor": 0, + "isNew": 0, + "isRobot": 0, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "Main", + "page": "Peremptory norm", + "regionIsoCode": "NSW", + "regionName": "New South Wales", + "user": "60.225.66.142", + "delta": 0, + "added": 0, + "deleted": 0 + }, + { + "__time": 1442018828770, + "channel": "#vi.wikipedia", + "cityName": "", + "comment": "fix Lỗi CS1: ngày tháng", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 1, + "isNew": 0, + "isRobot": 1, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "Main", + "page": "Apamea abruzzorum", + "regionIsoCode": "", + "regionName": "", + "user": "Cheers!-bot", + "delta": 18, + "added": 18, + "deleted": 0 + }, + { + "__time": 1442018831862, + "channel": "#vi.wikipedia", + "cityName": "", + "comment": "clean up using [[Project:AWB|AWB]]", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 0, + "isNew": 0, + "isRobot": 1, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "Main", + "page": "Atractus flammigerus", + "regionIsoCode": "", + "regionName": "", + "user": "ThitxongkhoiAWB", + "delta": 18, + "added": 18, + "deleted": 0 + }, + { + "__time": 1442018833987, + "channel": "#vi.wikipedia", + "cityName": "", + "comment": "clean up using [[Project:AWB|AWB]]", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 0, + "isNew": 0, + "isRobot": 1, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "Main", + "page": "Agama mossambica", + "regionIsoCode": "", + "regionName": "", + "user": "ThitxongkhoiAWB", + "delta": 18, + "added": 18, + "deleted": 0 + }, + { + "__time": 1442018837009, + "channel": "#ca.wikipedia", + "cityName": "", + "comment": "/* Imperi Austrohongarès */", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 0, + "isNew": 0, + "isRobot": 0, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "Main", + "page": "Campanya dels Balcans (1914-1918)", + "regionIsoCode": "", + "regionName": "", + "user": "Jaumellecha", + "delta": -20, + "added": 0, + "deleted": 20 + }, + { + "__time": 1442018839591, + "channel": "#en.wikipedia", + "cityName": "", + "comment": "adding comment on notability and possible COI", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 0, + "isNew": 1, + 
"isRobot": 0, + "isUnpatrolled": 1, + "metroCode": 0, + "namespace": "Talk", + "page": "Talk:Dani Ploeger", + "regionIsoCode": "", + "regionName": "", + "user": "New Media Theorist", + "delta": 345, + "added": 345, + "deleted": 0 + }, + { + "__time": 1442018841578, + "channel": "#en.wikipedia", + "cityName": "", + "comment": "Copying assessment table to wiki", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 0, + "isNew": 0, + "isRobot": 1, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "User", + "page": "User:WP 1.0 bot/Tables/Project/Pubs", + "regionIsoCode": "", + "regionName": "", + "user": "WP 1.0 bot", + "delta": 121, + "added": 121, + "deleted": 0 + }, + { + "__time": 1442018845821, + "channel": "#vi.wikipedia", + "cityName": "", + "comment": "clean up using [[Project:AWB|AWB]]", + "countryIsoCode": "", + "countryName": "", + "isAnonymous": 0, + "isMinor": 0, + "isNew": 0, + "isRobot": 1, + "isUnpatrolled": 0, + "metroCode": 0, + "namespace": "Main", + "page": "Agama persimilis", + "regionIsoCode": "", + "regionName": "", + "user": "ThitxongkhoiAWB", + "delta": 18, + "added": 18, + "deleted": 0 + } +] + ``` +
+ +### Cancel a query + +Cancels a running or accepted query. + +#### URL + +`DELETE` `/druid/v2/sql/statements/{queryId}` + +#### Responses + + + + + + +*A no op operation since the query is not in a state to be cancelled* + + + + + +*Successfully accepted query for cancellation* + + + + + +*Invalid query ID. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "Summary of the encountered error.", + "errorCode": "Well-defined error code.", + "persona": "Role or persona associated with the error.", + "category": "Classification of the error.", + "errorMessage": "Summary of the encountered issue with expanded information.", + "context": "Additional context about the error." +} +``` + + + + +--- + +#### Sample request + +The following example cancels a query with specified ID `query-945c9633-2fa2-49ab-80ae-8221c38c024da`. + + + + + + +```shell +curl --request DELETE "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/statements/query-945c9633-2fa2-49ab-80ae-8221c38c024da" +``` + + + + + +```HTTP +DELETE /druid/v2/sql/statements/query-945c9633-2fa2-49ab-80ae-8221c38c024da HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +A successful request returns an HTTP `202 ACCEPTED` message code and an empty response body. diff --git a/docs/35.0.0/api-reference/sql-ingestion-api.md b/docs/35.0.0/api-reference/sql-ingestion-api.md new file mode 100644 index 0000000000..59942aff8e --- /dev/null +++ b/docs/35.0.0/api-reference/sql-ingestion-api.md @@ -0,0 +1,850 @@ +--- +id: sql-ingestion-api +title: SQL-based ingestion API +sidebar_label: SQL-based ingestion +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + +:::info + This page describes SQL-based batch ingestion using the [`druid-multi-stage-query`](../multi-stage-query/index.md) + extension, new in Druid 24.0. Refer to the [ingestion methods](../ingestion/index.md#batch) table to determine which + ingestion method is right for you. +::: + +The **Query** view in the web console provides a friendly experience for the multi-stage query task engine (MSQ task engine) and multi-stage query architecture. We recommend using the web console if you don't need a programmatic interface. + +When using the API for the MSQ task engine, the action you want to take determines the endpoint you use: + +- `/druid/v2/sql/task`: Submit a query for ingestion. +- `/druid/indexer/v1/task`: Interact with a query, including getting its status or details, or canceling the query. This page describes a few of the Overlord Task APIs that you can use with the MSQ task engine. For information about Druid APIs, see the [API reference for Druid](../ingestion/tasks.md). + +In this topic, `http://ROUTER_IP:ROUTER_PORT` is a placeholder for your Router service address and port. Replace it with the information for your deployment. For example, use `http://localhost:8888` for quickstart deployments. + +## Submit a query + +Submits queries to the MSQ task engine. + +The `/druid/v2/sql/task` endpoint accepts the following: + +- [SQL requests in the JSON-over-HTTP form](sql-api.md#request-body) using the +`query`, `context`, and `parameters` fields. The endpoint ignores the `resultFormat`, `header`, `typesHeader`, and `sqlTypesHeader` fields. +- [INSERT](../multi-stage-query/reference.md#insert) and [REPLACE](../multi-stage-query/reference.md#replace) statements. +- SELECT queries (experimental feature). 
SELECT query results are collected from workers by the controller, and written into the [task report](#get-the-report-for-a-query-task) as an array of arrays. The behavior and result format of plain SELECT queries (without INSERT or REPLACE) is subject to change. + +### URL + +`POST` `/druid/v2/sql/task` + +### Responses + + + + + + +*Successfully submitted query* + + + + + +*Error thrown due to bad query. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "A well-defined error code.", + "errorMessage": "A message with additional details about the error.", + "errorClass": "Class of exception that caused this error.", + "host": "The host on which the error occurred." +} +``` + + + + +*Request not sent due to unexpected conditions. Returns a JSON object detailing the error with the following format:* + +```json +{ + "error": "A well-defined error code.", + "errorMessage": "A message with additional details about the error.", + "errorClass": "Class of exception that caused this error.", + "host": "The host on which the error occurred." +} +``` + + + + +--- + +### Sample request + +The following example shows a query that fetches data from an external JSON source and inserts it into a table named `wikipedia`. +The example specifies two query context parameters: + +- `maxNumTasks=3`: Limits the maximum number of parallel tasks to 3. +- `finalizeAggregations=false`: Ensures that Druid saves the aggregation's intermediate type during ingestion. For more information, see [Rollup](../multi-stage-query/concepts.md#rollup). + + + + + + +```HTTP +POST /druid/v2/sql/task HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json + +{ + "query": "SET maxNumTasks=3;\nSET finalizeAggregations=false;\nINSERT INTO wikipedia\nSELECT\n TIME_PARSE(\"timestamp\") AS __time,\n *\nFROM TABLE(\n EXTERN(\n '{\"type\": \"http\", \"uris\": [\"https://druid.apache.org/data/wikipedia.json.gz\"]}',\n '{\"type\": \"json\"}',\n '[{\"name\": \"added\", \"type\": \"long\"}, {\"name\": \"channel\", \"type\": \"string\"}, {\"name\": \"cityName\", \"type\": \"string\"}, {\"name\": \"comment\", \"type\": \"string\"}, {\"name\": \"commentLength\", \"type\": \"long\"}, {\"name\": \"countryIsoCode\", \"type\": \"string\"}, {\"name\": \"countryName\", \"type\": \"string\"}, {\"name\": \"deleted\", \"type\": \"long\"}, {\"name\": \"delta\", \"type\": \"long\"}, {\"name\": \"deltaBucket\", \"type\": \"string\"}, {\"name\": \"diffUrl\", \"type\": \"string\"}, {\"name\": \"flags\", \"type\": \"string\"}, {\"name\": \"isAnonymous\", \"type\": \"string\"}, {\"name\": \"isMinor\", \"type\": \"string\"}, {\"name\": \"isNew\", \"type\": \"string\"}, {\"name\": \"isRobot\", \"type\": \"string\"}, {\"name\": \"isUnpatrolled\", \"type\": \"string\"}, {\"name\": \"metroCode\", \"type\": \"string\"}, {\"name\": \"namespace\", \"type\": \"string\"}, {\"name\": \"page\", \"type\": \"string\"}, {\"name\": \"regionIsoCode\", \"type\": \"string\"}, {\"name\": \"regionName\", \"type\": \"string\"}, {\"name\": \"timestamp\", \"type\": \"string\"}, {\"name\": \"user\", \"type\": \"string\"}]'\n )\n)\nPARTITIONED BY DAY" +} +``` + + + + + + +```shell +curl --location --request POST 'http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/task' \ + --header 'Content-Type: application/json' \ + --data '{ + "query": "SET maxNumTasks=3;\nSET finalizeAggregations=false;\nINSERT INTO wikipedia\nSELECT\n TIME_PARSE(\"timestamp\") AS __time,\n *\nFROM TABLE(\n EXTERN(\n '\''{\"type\": \"http\", \"uris\": 
[\"https://druid.apache.org/data/wikipedia.json.gz\"]}'\'',\n '\''{\"type\": \"json\"}'\'',\n '\''[{\"name\": \"added\", \"type\": \"long\"}, {\"name\": \"channel\", \"type\": \"string\"}, {\"name\": \"cityName\", \"type\": \"string\"}, {\"name\": \"comment\", \"type\": \"string\"}, {\"name\": \"commentLength\", \"type\": \"long\"}, {\"name\": \"countryIsoCode\", \"type\": \"string\"}, {\"name\": \"countryName\", \"type\": \"string\"}, {\"name\": \"deleted\", \"type\": \"long\"}, {\"name\": \"delta\", \"type\": \"long\"}, {\"name\": \"deltaBucket\", \"type\": \"string\"}, {\"name\": \"diffUrl\", \"type\": \"string\"}, {\"name\": \"flags\", \"type\": \"string\"}, {\"name\": \"isAnonymous\", \"type\": \"string\"}, {\"name\": \"isMinor\", \"type\": \"string\"}, {\"name\": \"isNew\", \"type\": \"string\"}, {\"name\": \"isRobot\", \"type\": \"string\"}, {\"name\": \"isUnpatrolled\", \"type\": \"string\"}, {\"name\": \"metroCode\", \"type\": \"string\"}, {\"name\": \"namespace\", \"type\": \"string\"}, {\"name\": \"page\", \"type\": \"string\"}, {\"name\": \"regionIsoCode\", \"type\": \"string\"}, {\"name\": \"regionName\", \"type\": \"string\"}, {\"name\": \"timestamp\", \"type\": \"string\"}, {\"name\": \"user\", \"type\": \"string\"}]'\''\n )\n)\nPARTITIONED BY DAY" +}' +``` + + + + + + +```python +import json +import requests + +url = "http://ROUTER_IP:ROUTER_PORT/druid/v2/sql/task" + +payload = json.dumps({ + "query": "SET maxNumTasks=3;\nSET finalizeAggregations=false;\nINSERT INTO wikipedia\nSELECT\n TIME_PARSE(\"timestamp\") AS __time,\n *\nFROM TABLE(\n EXTERN(\n '{\"type\": \"http\", \"uris\": [\"https://druid.apache.org/data/wikipedia.json.gz\"]}',\n '{\"type\": \"json\"}',\n '[{\"name\": \"added\", \"type\": \"long\"}, {\"name\": \"channel\", \"type\": \"string\"}, {\"name\": \"cityName\", \"type\": \"string\"}, {\"name\": \"comment\", \"type\": \"string\"}, {\"name\": \"commentLength\", \"type\": \"long\"}, {\"name\": \"countryIsoCode\", \"type\": \"string\"}, {\"name\": \"countryName\", \"type\": \"string\"}, {\"name\": \"deleted\", \"type\": \"long\"}, {\"name\": \"delta\", \"type\": \"long\"}, {\"name\": \"deltaBucket\", \"type\": \"string\"}, {\"name\": \"diffUrl\", \"type\": \"string\"}, {\"name\": \"flags\", \"type\": \"string\"}, {\"name\": \"isAnonymous\", \"type\": \"string\"}, {\"name\": \"isMinor\", \"type\": \"string\"}, {\"name\": \"isNew\", \"type\": \"string\"}, {\"name\": \"isRobot\", \"type\": \"string\"}, {\"name\": \"isUnpatrolled\", \"type\": \"string\"}, {\"name\": \"metroCode\", \"type\": \"string\"}, {\"name\": \"namespace\", \"type\": \"string\"}, {\"name\": \"page\", \"type\": \"string\"}, {\"name\": \"regionIsoCode\", \"type\": \"string\"}, {\"name\": \"regionName\", \"type\": \"string\"}, {\"name\": \"timestamp\", \"type\": \"string\"}, {\"name\": \"user\", \"type\": \"string\"}]'\n )\n)\nPARTITIONED BY DAY" +}) +headers = { + 'Content-Type': 'application/json' +} + +response = requests.post(url, headers=headers, data=payload) + +print(response.text) + +``` + + + + + +### Sample response + +
+ View the response + +```json +{ + "taskId": "query-431c4a18-9dde-4ec8-ab82-ec7fd17d5a4e", + "state": "RUNNING" +} +``` +
+ +**Response fields** + +| Field | Description | +|---|---| +| `taskId` | Controller task ID. You can use Druid's standard [Tasks API](./tasks-api.md) to interact with this controller task. | +| `state` | Initial state for the query. | + +## Get the status for a query task + +Retrieves the status of a query task. It returns a JSON object with the task's status code, runner status, task type, datasource, and other relevant metadata. + +### URL + +`GET` `/druid/indexer/v1/task/{taskId}/status` + +### Responses + + + + + + +
+ +*Successfully retrieved task status* + +
+ + + +
+ +*Cannot find task with ID* + +
+
+
+---
+
+### Sample request
+
+The following example shows how to retrieve the status of a task with the ID `query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e`.
+
+
+```HTTP
+GET /druid/indexer/v1/task/query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e/status HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+```shell
+curl --location --request GET 'http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e/status'
+```
+
+
+```python
+import requests
+
+url = "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e/status"
+
+# The status endpoint is a GET request with no request body.
+response = requests.get(url)
+
+print(response.text)
+```
+
+
+### Sample response
+
+ View the response + +```json +{ + "task": "query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e", + "status": { + "id": "query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e", + "groupId": "query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e", + "type": "query_controller", + "createdTime": "2022-09-14T22:12:00.183Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "RUNNING", + "status": "RUNNING", + "runnerStatusCode": "RUNNING", + "duration": -1, + "location": { + "host": "localhost", + "port": 8100, + "tlsPort": -1 + }, + "dataSource": "kttm_simple", + "errorMsg": null + } +} +``` +
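+
+Because the status endpoint returns immediately, client code typically polls it until the controller task reaches a terminal state. The following is a minimal Python sketch, assuming a quickstart Router at `http://localhost:8888` and the controller task ID from the example above; it checks `status.statusCode` every few seconds until the task succeeds or fails.
+
+```python
+import time
+
+import requests
+
+# Hypothetical values: substitute your Router address and controller task ID.
+ROUTER = "http://localhost:8888"
+TASK_ID = "query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e"
+
+# Poll the task status until it reaches a terminal state.
+while True:
+    response = requests.get(f"{ROUTER}/druid/indexer/v1/task/{TASK_ID}/status")
+    response.raise_for_status()
+    status_code = response.json()["status"]["statusCode"]
+    print(f"Task {TASK_ID} is {status_code}")
+    if status_code in ("SUCCESS", "FAILED"):
+        break
+    time.sleep(5)
+```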
+
+## Get the report for a query task
+
+Retrieves the task report for a query.
+The report provides detailed information about the query task, including the stages, warnings, and errors.
+
+Keep the following in mind when using the task API to view reports:
+
+- The task report for an entire job is associated with the `query_controller` task. The `query_worker` tasks don't have their own reports; their information is incorporated into the controller report.
+- The task report API may report `404 Not Found` temporarily while the task is in the process of starting up.
+- As an experimental feature, the MSQ task engine supports running SELECT queries. SELECT query results are written into
+the `multiStageQuery.payload.results.results` task report key as an array of arrays. The behavior and result format of plain
+SELECT queries (without INSERT or REPLACE) is subject to change.
+- `multiStageQuery.payload.results.resultsTruncated` denotes whether the results in the report have been truncated to keep the report from growing too large.
+
+For an explanation of the fields in a report, see [Report response fields](#report-response-fields).
+
+### URL
+
+
+`GET` `/druid/indexer/v1/task/{taskId}/reports`
+
+### Responses
+
+
+ +*Successfully retrieved task report* + +
+
+
+---
+
+### Sample request
+
+The following example shows how to retrieve the report for a query with the task ID `query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e`.
+
+
+```HTTP
+GET /druid/indexer/v1/task/query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e/reports HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+```shell
+curl --location --request GET 'http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e/reports'
+```
+
+
+```python
+import requests
+
+url = "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e/reports"
+
+# The report endpoint is a GET request with no request body.
+response = requests.get(url)
+
+print(response.text)
+```
+
+
+### Sample response
+
+The response shows an example report for a query.
+
+View the response + +```json +{ + "multiStageQuery": { + "type": "multiStageQuery", + "taskId": "query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e", + "payload": { + "status": { + "status": "SUCCESS", + "startTime": "2022-09-14T22:12:09.266Z", + "durationMs": 28227, + "workers": { + "0": [ + { + "workerId": "query-3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e-worker0_0", + "state": "SUCCESS", + "durationMs": 15511, + "pendingMs": 137 + } + ] + }, + "pendingTasks": 0, + "runningTasks": 2, + "segmentLoadWaiterStatus": { + "state": "SUCCESS", + "dataSource": "kttm_simple", + "startTime": "2022-09-14T23:12:09.266Z", + "duration": 15, + "totalSegments": 1, + "usedSegments": 1, + "precachedSegments": 0, + "onDemandSegments": 0, + "pendingSegments": 0, + "unknownSegments": 0 + }, + "segmentReport": { + "shardSpec": "NumberedShardSpec", + "details": "Cannot use RangeShardSpec, RangedShardSpec only supports string CLUSTER BY keys. Using NumberedShardSpec instead." + } + }, + "stages": [ + { + "stageNumber": 0, + "definition": { + "id": "71ecb11e-09d7-42f8-9225-1662c8e7e121_0", + "input": [ + { + "type": "external", + "inputSource": { + "type": "http", + "uris": [ + "https://static.imply.io/example-data/kttm-v2/kttm-v2-2019-08-25.json.gz" + ], + "httpAuthenticationUsername": null, + "httpAuthenticationPassword": null + }, + "inputFormat": { + "type": "json", + "flattenSpec": null, + "featureSpec": {}, + "keepNullColumns": false + }, + "signature": [ + { + "name": "timestamp", + "type": "STRING" + }, + { + "name": "agent_category", + "type": "STRING" + }, + { + "name": "agent_type", + "type": "STRING" + } + ] + } + ], + "processor": { + "type": "scan", + "query": { + "queryType": "scan", + "dataSource": { + "type": "inputNumber", + "inputNumber": 0 + }, + "intervals": { + "type": "intervals", + "intervals": [ + "-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z" + ] + }, + "resultFormat": "compactedList", + "columns": [ + "agent_category", + "agent_type", + "timestamp" + ], + "context": { + "finalize": false, + "finalizeAggregations": false, + "groupByEnableMultiValueUnnesting": false, + "scanSignature": "[{\"name\":\"agent_category\",\"type\":\"STRING\"},{\"name\":\"agent_type\",\"type\":\"STRING\"},{\"name\":\"timestamp\",\"type\":\"STRING\"}]", + "sqlInsertSegmentGranularity": "{\"type\":\"all\"}", + "sqlQueryId": "3dc0c45d-34d7-4b15-86c9-cdb2d3ebfc4e", + "sqlReplaceTimeChunks": "all" + }, + "granularity": { + "type": "all" + } + } + }, + "signature": [ + { + "name": "__boost", + "type": "LONG" + }, + { + "name": "agent_category", + "type": "STRING" + }, + { + "name": "agent_type", + "type": "STRING" + }, + { + "name": "timestamp", + "type": "STRING" + } + ], + "shuffleSpec": { + "type": "targetSize", + "clusterBy": { + "columns": [ + { + "columnName": "__boost" + } + ] + }, + "targetSize": 3000000 + }, + "maxWorkerCount": 1, + "shuffleCheckHasMultipleValues": true + }, + "phase": "FINISHED", + "workerCount": 1, + "partitionCount": 1, + "startTime": "2022-09-14T22:12:11.663Z", + "duration": 19965, + "sort": true + }, + { + "stageNumber": 1, + "definition": { + "id": "71ecb11e-09d7-42f8-9225-1662c8e7e121_1", + "input": [ + { + "type": "stage", + "stage": 0 + } + ], + "processor": { + "type": "segmentGenerator", + "dataSchema": { + "dataSource": "kttm_simple", + "timestampSpec": { + "column": "__time", + "format": "millis", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "timestamp", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true 
+ }, + { + "type": "string", + "name": "agent_category", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "agent_type", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "arbitrary", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [ + "-146136543-09-08T08:23:32.096Z/146140482-04-24T15:36:27.903Z" + ] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "columnMappings": [ + { + "queryColumn": "timestamp", + "outputColumn": "timestamp" + }, + { + "queryColumn": "agent_category", + "outputColumn": "agent_category" + }, + { + "queryColumn": "agent_type", + "outputColumn": "agent_type" + } + ], + "tuningConfig": { + "maxNumWorkers": 1, + "maxRowsInMemory": 100000, + "rowsPerSegment": 3000000 + } + }, + "signature": [], + "maxWorkerCount": 1 + }, + "phase": "FINISHED", + "workerCount": 1, + "partitionCount": 1, + "startTime": "2022-09-14T22:12:31.602Z", + "duration": 5891 + } + ], + "counters": { + "0": { + "0": { + "input0": { + "type": "channel", + "rows": [ + 465346 + ], + "files": [ + 1 + ], + "totalFiles": [ + 1 + ] + }, + "output": { + "type": "channel", + "rows": [ + 465346 + ], + "bytes": [ + 43694447 + ], + "frames": [ + 7 + ] + }, + "shuffle": { + "type": "channel", + "rows": [ + 465346 + ], + "bytes": [ + 41835307 + ], + "frames": [ + 73 + ] + }, + "sortProgress": { + "type": "sortProgress", + "totalMergingLevels": 3, + "levelToTotalBatches": { + "0": 1, + "1": 1, + "2": 1 + }, + "levelToMergedBatches": { + "0": 1, + "1": 1, + "2": 1 + }, + "totalMergersForUltimateLevel": 1, + "progressDigest": 1 + } + } + }, + "1": { + "0": { + "input0": { + "type": "channel", + "rows": [ + 465346 + ], + "bytes": [ + 41835307 + ], + "frames": [ + 73 + ] + }, + "segmentGenerationProgress": { + "type": "segmentGenerationProgress", + "rowsProcessed": 465346, + "rowsPersisted": 465346, + "rowsMerged": 465346 + } + } + } + } + } + } +} +``` + +
+ + + +The following table describes the response fields when you retrieve a report for a MSQ task engine using the `/druid/indexer/v1/task/{taskId}/reports` endpoint: + +| Field | Description | +|---|---| +| `multiStageQuery.taskId` | Controller task ID. | +| `multiStageQuery.payload.status` | Query status container. | +| `multiStageQuery.payload.status.status` | RUNNING, SUCCESS, or FAILED. | +| `multiStageQuery.payload.status.startTime` | Start time of the query in ISO format. Only present if the query has started running. | +| `multiStageQuery.payload.status.durationMs` | Milliseconds elapsed after the query has started running. -1 denotes that the query hasn't started running yet. | +| `multiStageQuery.payload.status.workers` | Workers for the controller task.| +| `multiStageQuery.payload.status.workers.` | Array of worker tasks including retries. | +| `multiStageQuery.payload.status.workers.[].workerId` | Id of the worker task.| | +| `multiStageQuery.payload.status.workers.[].status` | RUNNING, SUCCESS, or FAILED.| +| `multiStageQuery.payload.status.workers.[].durationMs` | Milliseconds elapsed between when the worker task was first requested and when it finished. It is -1 for worker tasks with status RUNNING.| +| `multiStageQuery.payload.status.workers.[].pendingMs` | Milliseconds elapsed between when the worker task was first requested and when it fully started RUNNING. Actual work time can be calculated using `actualWorkTimeMS = durationMs - pendingMs`.| +| `multiStageQuery.payload.status.pendingTasks` | Number of tasks that are not fully started. -1 denotes that the number is currently unknown. | +| `multiStageQuery.payload.status.runningTasks` | Number of currently running tasks. Should be at least 1 since the controller is included. | +| `multiStageQuery.payload.status.segmentLoadStatus` | Segment loading container. Only present after the segments have been published. | +| `multiStageQuery.payload.status.segmentLoadStatus.state` | Either INIT, WAITING, SUCCESS, FAILED or TIMED_OUT. | +| `multiStageQuery.payload.status.segmentLoadStatus.startTime` | Time since which the controller has been waiting for the segments to finish loading. | +| `multiStageQuery.payload.status.segmentLoadStatus.duration` | The duration in milliseconds that the controller has been waiting for the segments to load. | +| `multiStageQuery.payload.status.segmentLoadStatus.totalSegments` | The total number of segments generated by the job. This includes tombstone segments (if any). | +| `multiStageQuery.payload.status.segmentLoadStatus.usedSegments` | The number of segments which are marked as used based on the load rules. Unused segments can be cleaned up at any time. | +| `multiStageQuery.payload.status.segmentLoadStatus.precachedSegments` | The number of segments which are marked as precached and served by historicals, as per the load rules. | +| `multiStageQuery.payload.status.segmentLoadStatus.onDemandSegments` | The number of segments which are not loaded on any historical, as per the load rules. | +| `multiStageQuery.payload.status.segmentLoadStatus.pendingSegments` | The number of segments remaining to be loaded. | +| `multiStageQuery.payload.status.segmentLoadStatus.unknownSegments` | The number of segments whose status is unknown. | +| `multiStageQuery.payload.status.segmentReport` | Segment report. Only present if the query is an ingestion. | +| `multiStageQuery.payload.status.segmentReport.shardSpec` | Contains the shard spec chosen. 
| +| `multiStageQuery.payload.status.segmentReport.details` | Contains further reasoning about the shard spec chosen. | +| `multiStageQuery.payload.status.errorReport` | Error object. Only present if there was an error. | +| `multiStageQuery.payload.status.errorReport.taskId` | The task that reported the error, if known. May be a controller task or a worker task. | +| `multiStageQuery.payload.status.errorReport.host` | The hostname and port of the task that reported the error, if known. | +| `multiStageQuery.payload.status.errorReport.stageNumber` | The stage number that reported the error, if it happened during execution of a specific stage. | +| `multiStageQuery.payload.status.errorReport.error` | Error object. Contains `errorCode` at a minimum, and may contain other fields as described in the [error code table](../multi-stage-query/reference.md#error-codes). Always present if there is an error. | +| `multiStageQuery.payload.status.errorReport.error.errorCode` | One of the error codes from the [error code table](../multi-stage-query/reference.md#error-codes). Always present if there is an error. | +| `multiStageQuery.payload.status.errorReport.error.errorMessage` | User-friendly error message. Not always present, even if there is an error. | +| `multiStageQuery.payload.status.errorReport.exceptionStackTrace` | Java stack trace in string form, if the error was due to a server-side exception. | +| `multiStageQuery.payload.stages` | Array of query stages. | +| `multiStageQuery.payload.stages[].stageNumber` | Each stage has a number that differentiates it from other stages. | +| `multiStageQuery.payload.stages[].phase` | Either NEW, READING_INPUT, POST_READING, RESULTS_COMPLETE, or FAILED. Only present if the stage has started. | +| `multiStageQuery.payload.stages[].workerCount` | Number of parallel tasks that this stage is running on. Only present if the stage has started. | +| `multiStageQuery.payload.stages[].partitionCount` | Number of output partitions generated by this stage. Only present if the stage has started and has computed its number of output partitions. | +| `multiStageQuery.payload.stages[].startTime` | Start time of this stage. Only present if the stage has started. | +| `multiStageQuery.payload.stages[].duration` | The number of milliseconds that the stage has been running. Only present if the stage has started. | +| `multiStageQuery.payload.stages[].sort` | A boolean that is set to `true` if the stage does a sort as part of its execution. | +| `multiStageQuery.payload.stages[].definition` | The object defining what the stage does. | +| `multiStageQuery.payload.stages[].definition.id` | The unique identifier of the stage. | +| `multiStageQuery.payload.stages[].definition.input` | Array of inputs that the stage has. | +| `multiStageQuery.payload.stages[].definition.broadcast` | Array of input indexes that get broadcasted. Only present if there are inputs that get broadcasted. | +| `multiStageQuery.payload.stages[].definition.processor` | An object defining the processor logic. | +| `multiStageQuery.payload.stages[].definition.signature` | The output signature of the stage. | + +## Cancel a query task + +Cancels a query task. +Returns a JSON object with the ID of the task that was canceled successfully. + +### URL + +`POST` `/druid/indexer/v1/task/{taskId}/shutdown` + +### Responses + + + + + + +
+ +*Successfully shut down task* + +
+ + + +
+ +*Cannot find task with ID or task is no longer running* + +
+
+ +--- + +### Sample request + +The following example shows how to cancel a query task with the ID `query-655efe33-781a-4c50-ae84-c2911b42d63c`. + + + + + + +```HTTP +POST /druid/indexer/v1/task/query-655efe33-781a-4c50-ae84-c2911b42d63c/shutdown HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + + + +```shell +curl --location --request POST 'http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-655efe33-781a-4c50-ae84-c2911b42d63c/shutdown' +``` + + + + + + +```python +import requests + +url = "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-655efe33-781a-4c50-ae84-c2911b42d63c/shutdown" + +payload = {} +headers = {} + +response = requests.post(url, headers=headers, data=payload) + +print(response.text) +print(response.text) +``` + + + + + +### Sample response + +The response shows the ID of the task that was canceled. + +```json +{ + "task": "query-655efe33-781a-4c50-ae84-c2911b42d63c" +} +``` \ No newline at end of file diff --git a/docs/35.0.0/api-reference/sql-jdbc.md b/docs/35.0.0/api-reference/sql-jdbc.md new file mode 100644 index 0000000000..affe9ea738 --- /dev/null +++ b/docs/35.0.0/api-reference/sql-jdbc.md @@ -0,0 +1,251 @@ +--- +id: sql-jdbc +title: SQL JDBC driver API +sidebar_label: SQL JDBC driver +--- + + + +:::info + Apache Druid supports two query languages: Druid SQL and [native queries](../querying/querying.md). + This document describes the SQL language. +::: + +You can make [Druid SQL](../querying/sql.md) queries using the [Avatica JDBC driver](https://calcite.apache.org/avatica/downloads/). +We recommend using Avatica JDBC driver version 1.23.0 or later. Note that starting with Avatica 1.21.0, you may need to set the [`transparent_reconnection`](https://calcite.apache.org/avatica/docs/client_reference.html#transparent_reconnection) property to `true` if you notice intermittent query failures. + +Once you've downloaded the Avatica client jar, add it to your classpath. + +Example connection string: + +``` +jdbc:avatica:remote:url=http://localhost:8888/druid/v2/sql/avatica/;transparent_reconnection=true +``` + +Or, to use the protobuf protocol instead of JSON: + +``` +jdbc:avatica:remote:url=http://localhost:8888/druid/v2/sql/avatica-protobuf/;transparent_reconnection=true;serialization=protobuf +``` + +The `url` is the `/druid/v2/sql/avatica/` endpoint on the Router, which routes JDBC connections to a consistent Broker. +For more information, see [Connection stickiness](#connection-stickiness). + +Set `transparent_reconnection` to `true` so your connection is not interrupted if the pool of Brokers changes membership, +or if a Broker is restarted. + +Set `serialization` to `protobuf` if using the protobuf endpoint. + +Note that as of the time of this writing, Avatica 1.23.0, the latest version, does not support passing +[connection context parameters](../querying/sql-query-context.md) from the JDBC connection string to Druid. These context parameters +must be passed using a `Properties` object instead. Refer to the Java code below for an example. + +Example Java code: + +```java +// Connect to /druid/v2/sql/avatica/ on your Broker. +String url = "jdbc:avatica:remote:url=http://localhost:8888/druid/v2/sql/avatica/;transparent_reconnection=true"; + +// Set any connection context parameters you need here. +// Any property from https://druid.apache.org/docs/latest/querying/sql-query-context.html can go here. 
+Properties connectionProperties = new Properties();
+connectionProperties.setProperty("sqlTimeZone", "Etc/UTC");
+// To connect to a Druid deployment protected by basic authentication,
+// you can incorporate authentication details from https://druid.apache.org/docs/latest/operations/security-overview
+connectionProperties.setProperty("user", "admin");
+connectionProperties.setProperty("password", "password1");
+
+try (Connection connection = DriverManager.getConnection(url, connectionProperties)) {
+  try (
+      final Statement statement = connection.createStatement();
+      final ResultSet resultSet = statement.executeQuery(query)
+  ) {
+    while (resultSet.next()) {
+      // process result set
+    }
+  }
+}
+```
+
+For a runnable example that includes a query that you might run, see [Examples](#examples).
+
+You can also use a protocol buffers JDBC connection with Druid, which offers reduced bloat and potential performance
+improvements for larger result sets. To use it, apply the following connection URL instead; everything else remains the same:
+
+```
+String url = "jdbc:avatica:remote:url=http://localhost:8888/druid/v2/sql/avatica-protobuf/;transparent_reconnection=true;serialization=protobuf";
+```
+
+:::info
+  The protobuf endpoint is also known to work with the official [Golang Avatica driver](https://github.com/apache/calcite-avatica-go).
+:::
+
+Table metadata is available over JDBC using `connection.getMetaData()` or by querying the
+[INFORMATION_SCHEMA tables](../querying/sql-metadata-tables.md). For an example of this, see [Get the metadata for a datasource](#get-the-metadata-for-a-datasource).
+
+## Connection stickiness
+
+Druid's JDBC server does not share connection state between Brokers. This means that if you're using JDBC and have
+multiple Druid Brokers, you should either connect to a specific Broker or use a load balancer with sticky sessions
+enabled. The Druid Router process provides connection stickiness when balancing JDBC requests, and can be used to achieve
+the necessary stickiness even with a normal non-sticky load balancer. Please see the
+[Router](../design/router.md) documentation for more details.
+
+Note that the non-JDBC [JSON over HTTP](sql-api.md#submit-a-query) API is stateless and does not require stickiness.
+
+## Dynamic parameters
+
+You can use [parameterized queries](../querying/sql.md#dynamic-parameters) in JDBC code, as in this example:
+
+```java
+PreparedStatement statement = connection.prepareStatement("SELECT COUNT(*) AS cnt FROM druid.foo WHERE dim1 = ? OR dim1 = ?");
+statement.setString(1, "abc");
+statement.setString(2, "def");
+final ResultSet resultSet = statement.executeQuery();
+```
+
+Sample code where dynamic parameters replace arrays using STRING_TO_ARRAY:
+```java
+PreparedStatement statement = connection.prepareStatement("select l1 from numfoo where SCALAR_IN_ARRAY(l1, STRING_TO_ARRAY(CAST(? 
as varchar),','))"); +List li = ImmutableList.of(0, 7); +String sqlArg = Joiner.on(",").join(li); +statement.setString(1, sqlArg); +statement.executeQuery(); +``` + +Sample code using native array: +```java +PreparedStatement statement = connection.prepareStatement("select l1 from numfoo where SCALAR_IN_ARRAY(l1, ?)"); +Iterable list = ImmutableList.of(0, 7); +ArrayFactoryImpl arrayFactoryImpl = new ArrayFactoryImpl(TimeZone.getDefault()); +AvaticaType type = ColumnMetaData.scalar(Types.INTEGER, SqlType.INTEGER.name(), Rep.INTEGER); +Array array = arrayFactoryImpl.createArray(type, list); +statement.setArray(1, array); +statement.executeQuery(); +``` + +## Examples + + + +The following section contains two complete samples that use the JDBC connector: + +- [Get the metadata for a datasource](#get-the-metadata-for-a-datasource) shows you how to query the `INFORMATION_SCHEMA` to get metadata like column names. +- [Query data](#query-data) runs a select query against the datasource. + +You can try out these examples after verifying that you meet the [prerequisites](#prerequisites). + +For more information about the connection options, see [Client Reference](https://calcite.apache.org/avatica/docs/client_reference.html). + +### Prerequisites + +Make sure you meet the following requirements before trying these examples: + +- A supported [Java version](../operations/java.md) + +- [Avatica JDBC driver](https://calcite.apache.org/avatica/downloads/). You can add the JAR to your `CLASSPATH` directly or manage it externally, such as through Maven and a `pom.xml` file. + +- An available Druid instance. You can use the `micro-quickstart` configuration described in [Quickstart (local)](../tutorials/index.md). The examples assume that you are using the quickstart, so no authentication or authorization is expected unless explicitly mentioned. + +- The example `wikipedia` datasource from the quickstart is loaded on your Druid instance. If you have a different datasource loaded, you can still try these examples. You'll have to update the table name and column names to match your datasource. + +### Get the metadata for a datasource + +Metadata, such as column names, is available either through the [`INFORMATION_SCHEMA`](../querying/sql-metadata-tables.md) table or through `connection.getMetaData()`. The following example uses the `INFORMATION_SCHEMA` table to retrieve and print the list of column names for the `wikipedia` datasource that you loaded during a previous tutorial. + +```java +import java.sql.*; +import java.util.Properties; + +public class JdbcListColumns { + + public static void main(String[] args) + { + // Connect to /druid/v2/sql/avatica/ on your Router. + // You can connect to a Broker but must configure connection stickiness if you do. + String url = "jdbc:avatica:remote:url=http://localhost:8888/druid/v2/sql/avatica/;transparent_reconnection=true"; + + String query = "SELECT COLUMN_NAME,* FROM INFORMATION_SCHEMA.COLUMNS WHERE TABLE_NAME = 'wikipedia' and TABLE_SCHEMA='druid'"; + + // Set any connection context parameters you need here. + // Any property from https://druid.apache.org/docs/latest/querying/sql-query-context.html can go here. 
+ Properties connectionProperties = new Properties(); + + try (Connection connection = DriverManager.getConnection(url, connectionProperties)) { + try ( + final Statement statement = connection.createStatement(); + final ResultSet rs = statement.executeQuery(query) + ) { + while (rs.next()) { + String columnName = rs.getString("COLUMN_NAME"); + System.out.println(columnName); + } + } + } catch (SQLException e) { + throw new RuntimeException(e); + } + + } +} +``` + +### Query data + +Now that you know what columns are available, you can start querying the data. The following example queries the datasource named `wikipedia` for the timestamps and comments from Japan. It also sets the [query context parameter](../querying/sql-query-context.md) `sqlTimeZone`. Optionally, you can also parameterize queries by using [dynamic parameters](#dynamic-parameters). + +```java +import java.sql.*; +import java.util.Properties; + +public class JdbcCountryAndTime { + + public static void main(String[] args) + { + // Connect to /druid/v2/sql/avatica/ on your Router. + // You can connect to a Broker but must configure connection stickiness if you do. + String url = "jdbc:avatica:remote:url=http://localhost:8888/druid/v2/sql/avatica/;transparent_reconnection=true"; + + //The query you want to run. + String query = "SELECT __time, isRobot, countryName, comment FROM wikipedia WHERE countryName='Japan'"; + + // Set any connection context parameters you need here. + // Any property from https://druid.apache.org/docs/latest/querying/sql-query-context.html can go here. + Properties connectionProperties = new Properties(); + connectionProperties.setProperty("sqlTimeZone", "America/Los_Angeles"); + + try (Connection connection = DriverManager.getConnection(url, connectionProperties)) { + try ( + final Statement statement = connection.createStatement(); + final ResultSet rs = statement.executeQuery(query) + ) { + while (rs.next()) { + Timestamp timeStamp = rs.getTimestamp("__time"); + String comment = rs.getString("comment"); + System.out.println(timeStamp); + System.out.println(comment); + } + } + } catch (SQLException e) { + throw new RuntimeException(e); + } + + } +} +``` diff --git a/docs/35.0.0/api-reference/supervisor-api.md b/docs/35.0.0/api-reference/supervisor-api.md new file mode 100644 index 0000000000..38e68d4e13 --- /dev/null +++ b/docs/35.0.0/api-reference/supervisor-api.md @@ -0,0 +1,3652 @@ +--- +id: supervisor-api +title: Supervisor API +sidebar_label: Supervisors +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + +This topic describes the API endpoints to manage and monitor supervisors for Apache Druid. +The topic uses the Apache Kafka term offset to refer to the identifier for records in a partition. If you are using Amazon Kinesis, the equivalent is sequence number. + +In this topic, `http://ROUTER_IP:ROUTER_PORT` is a placeholder for your Router service address and port. Replace it with the information for your deployment. For example, use `http://localhost:8888` for quickstart deployments. + +## Supervisor information + +The following table lists the properties of a supervisor object: + +|Property|Type|Description| +|---|---|---| +|`id`|String|Unique identifier.| +|`state`|String|Generic state of the supervisor. Available states:`UNHEALTHY_SUPERVISOR`, `UNHEALTHY_TASKS`, `PENDING`, `RUNNING`, `SUSPENDED`, `STOPPING`. See [Supervisor reference](../ingestion/supervisor.md#status-report) for more information.| +|`detailedState`|String|Detailed state of the supervisor. 
This property contains a more descriptive, implementation-specific state that may provide more insight into the supervisor's activities than the `state` property. See [Apache Kafka ingestion](../ingestion/kafka-ingestion.md) and [Amazon Kinesis ingestion](../ingestion/kinesis-ingestion.md) for supervisor-specific states.| +|`healthy`|Boolean|Supervisor health indicator.| +|`spec`|Object|Container object for the supervisor configuration.| +|`suspended`|Boolean|Indicates whether the supervisor is in a suspended state.| + +### Get an array of active supervisor IDs + +Returns an array of strings representing the names of active supervisors. If there are no active supervisors, it returns an empty array. + +#### URL + +`GET` `/druid/indexer/v1/supervisor` + +#### Responses + + + + + + +*Successfully retrieved array of active supervisor IDs* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + [ + "wikipedia_stream", + "social_media" + ] + ``` +
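+
+A common use for this endpoint is checking whether a particular supervisor is currently active before acting on it. The following is a minimal Python sketch, assuming a quickstart Router at `http://localhost:8888` and a hypothetical supervisor named `social_media`.
+
+```python
+import requests
+
+# Hypothetical values: substitute your Router address and supervisor ID.
+ROUTER = "http://localhost:8888"
+SUPERVISOR_ID = "social_media"
+
+# The endpoint returns a JSON array of active supervisor IDs,
+# for example ["wikipedia_stream", "social_media"].
+active_ids = requests.get(f"{ROUTER}/druid/indexer/v1/supervisor").json()
+
+if SUPERVISOR_ID in active_ids:
+    print(f"Supervisor {SUPERVISOR_ID} is active")
+else:
+    print(f"Supervisor {SUPERVISOR_ID} is not active")
+```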
+ +### Get an array of active supervisor objects + +Retrieves an array of active supervisor objects. If there are no active supervisors, it returns an empty array. For reference on the supervisor object properties, see the preceding [table](#supervisor-information). + +#### URL + +`GET` `/druid/indexer/v1/supervisor?full` + +#### Responses + + + + + + +*Successfully retrieved supervisor objects* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor?full=null" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor?full=null HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + [ + { + "id": "wikipedia_stream", + "state": "RUNNING", + "detailedState": "CONNECTING_TO_STREAM", + "healthy": true, + "spec": { + "type": "kafka", + "spec": { + "dataSchema": { + "dataSource": "wikipedia_stream", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9042" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + } + }, + "dataSchema": { + "dataSource": "wikipedia_stream", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ 
+ { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9042" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "context": null, + "suspended": false + }, + "suspended": false + }, + { + "id": "social_media", + "state": "RUNNING", + "detailedState": "RUNNING", + "healthy": true, + "spec": { + "type": "kafka", + "spec": { + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + 
"multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + } + }, + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": 
"SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "context": null, + "suspended": false + }, + "suspended": false + } + ] + ``` +
+ +### Get an array of supervisor states + +Retrieves an array of objects representing active supervisors and their current state. If there are no active supervisors, it returns an empty array. For reference on the supervisor object properties, see the preceding [table](#supervisor-information). + +#### URL + +`GET` `/druid/indexer/v1/supervisor?state=true` + +#### Responses + + + + + + +*Successfully retrieved supervisor state objects* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor?state=true" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor?state=true HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + [ + { + "id": "wikipedia_stream", + "state": "UNHEALTHY_SUPERVISOR", + "detailedState": "UNABLE_TO_CONNECT_TO_STREAM", + "healthy": false, + "suspended": false + }, + { + "id": "social_media", + "state": "RUNNING", + "detailedState": "RUNNING", + "healthy": true, + "suspended": false + } + ] + ``` + +
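+
+Because this endpoint returns a compact array, it is convenient for scripted health checks. The following sketch, which assumes the `jq` command-line JSON processor is installed on the machine issuing the request, prints only the IDs of supervisors that report as unhealthy:
+
+```shell
+# Print the IDs of supervisors whose state objects report healthy == false.
+# Assumes jq is installed.
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor?state=true" \
+  | jq -r '.[] | select(.healthy == false) | .id'
+```
+
+Against the sample response above, this prints `wikipedia_stream`.
+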
+ +### Get supervisor specification + +Retrieves the specification for a single supervisor. The returned specification includes the `dataSchema`, `ioConfig`, and `tuningConfig` objects. + +#### URL + +`GET` `/druid/indexer/v1/supervisor/{supervisorId}` + +#### Responses + + + + + + +*Successfully retrieved supervisor spec* + + + + + +*Invalid supervisor ID* + + + + +--- + +#### Sample request + +The following example shows how to retrieve the specification of a supervisor with the name `wikipedia_stream`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/wikipedia_stream" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor/wikipedia_stream HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + + +#### Sample response + +
+ View the response + + ```json +{ + "type": "kafka", + "spec": { + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + } + }, + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": 
"string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "context": null, + "suspended": false +} + ``` +
+ +### Get supervisor status + +Retrieves the current status report for a single supervisor. The report contains the state of the supervisor tasks and an array of recently thrown exceptions. + +For additional information about the status report, see [Supervisor reference](../ingestion/supervisor.md#status-report). + +#### URL + +`GET` `/druid/indexer/v1/supervisor/{supervisorId}/status` + +#### Responses + + + + + + +*Successfully retrieved supervisor status* + + + + + +*Invalid supervisor ID* + + + + +--- + +#### Sample request + +The following example shows how to retrieve the status of a supervisor with the name `social_media`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/status" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor/social_media/status HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "id": "social_media", + "generationTime": "2023-07-05T23:24:43.934Z", + "payload": { + "dataSource": "social_media", + "stream": "social_media", + "partitions": 1, + "replicas": 1, + "durationSeconds": 3600, + "activeTasks": [ + { + "id": "index_kafka_social_media_ab72ae4127c591c_flcbhdlh", + "startingOffsets": { + "0": 3176381 + }, + "startTime": "2023-07-05T23:21:39.321Z", + "remainingSeconds": 3415, + "type": "ACTIVE", + "currentOffsets": { + "0": 3296632 + }, + "lag": { + "0": 3 + } + } + ], + "publishingTasks": [], + "latestOffsets": { + "0": 3296635 + }, + "minimumLag": { + "0": 3 + }, + "aggregateLag": 3, + "offsetsLastUpdated": "2023-07-05T23:24:30.212Z", + "suspended": false, + "healthy": true, + "state": "RUNNING", + "detailedState": "RUNNING", + "recentErrors": [] + } + } + ``` +
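+
+The status payload includes per-partition and aggregate lag, which makes this endpoint a natural source for monitoring. The following sketch, assuming the `jq` JSON processor is installed, extracts just the state and lag figures:
+
+```shell
+# Report supervisor state and consumer lag without the full status payload.
+# Assumes jq is installed.
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/status" \
+  | jq '{state: .payload.state, aggregateLag: .payload.aggregateLag, minimumLag: .payload.minimumLag}'
+```
+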
+ +### Get supervisor health + +Retrieves the current health report for a single supervisor. The health of a supervisor is determined by the supervisor's `state` (as returned by the `/status` endpoint) and the `druid.supervisor.*` Overlord configuration thresholds. + +#### URL + +`GET` `/druid/indexer/v1/supervisor/{supervisorId}/health` + +#### Responses + + + + + +*Supervisor is healthy* + + + + + +*Invalid supervisor ID* + + + + + +*Supervisor is unhealthy* + + + + + +--- + +#### Sample request + +The following example shows how to retrieve the health report for a supervisor with the name `social_media`. + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/health" +``` + + + + +```HTTP +GET /druid/indexer/v1/supervisor/social_media/health HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "healthy": false + } + ``` +
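+
+Because the endpoint signals health through the HTTP response code as well as the body, you can use it directly in a monitoring script. The following sketch treats any non-200 response, including an invalid supervisor ID, as unhealthy:
+
+```shell
+# Exit non-zero when the supervisor does not report healthy.
+code=$(curl -s -o /dev/null -w "%{http_code}" \
+  "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/health")
+if [ "$code" -eq 200 ]; then
+  echo "social_media is healthy"
+else
+  echo "social_media is not healthy (HTTP $code)"
+  exit 1
+fi
+```
+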
+ +### Get supervisor ingestion stats + +Returns a snapshot of the current ingestion row counters for each task being managed by the supervisor, along with moving averages for the row counters. See [Row stats](../ingestion/tasks.md#row-stats) for more information. + +#### URL + +`GET` `/druid/indexer/v1/supervisor/{supervisorId}/stats` + +#### Responses + + + + + +*Successfully retrieved supervisor stats* + + + + + +*Invalid supervisor ID* + + + + + +--- + +#### Sample request + +The following example shows how to retrieve the current ingestion row counters for a supervisor with the name `custom_data`. + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/custom_data/stats" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor/custom_data/stats HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "0": { + "index_kafka_custom_data_881d621078f6b7c_ccplchbi": { + "movingAverages": { + "buildSegments": { + "5m": { + "processed": 53.401225142603316, + "processedBytes": 5226.400757148808, + "unparseable": 0.0, + "thrownAway": 0.0, + "processedWithError": 0.0 + }, + "15m": { + "processed": 56.92994990102502, + "processedBytes": 5571.772059828217, + "unparseable": 0.0, + "thrownAway": 0.0, + "processedWithError": 0.0 + }, + "1m": { + "processed": 37.134921285556636, + "processedBytes": 3634.2766230628677, + "unparseable": 0.0, + "thrownAway": 0.0, + "processedWithError": 0.0 + } + } + }, + "totals": { + "buildSegments": { + "processed": 665, + "processedBytes": 65079, + "processedWithError": 0, + "thrownAway": 0, + "unparseable": 0 + } + } + } + } + } + ``` +
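+
+To track throughput over time, you can reduce the stats snapshot to a single number. The following sketch, assuming the `jq` JSON processor is installed, sums the total processed row count across all tasks managed by the supervisor:
+
+```shell
+# Sum the total processed rows across every task group and task.
+# Assumes jq is installed.
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/custom_data/stats" \
+  | jq '[.[] | .[] | .totals.buildSegments.processed] | add'
+```
+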
+ +## Audit history + +An audit history provides a comprehensive log of events, including supervisor configuration, creation, suspension, and modification history. + +### Get audit history for all supervisors + +Retrieves an audit history of specs for all supervisors. + +#### URL + +`GET` `/druid/indexer/v1/supervisor/history` + +#### Responses + + + + + + +*Successfully retrieved audit history* + + + + +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/history" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor/history HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json +{ + "social_media": [ + { + "spec": { + "type": "kafka", + "spec": { + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + } + }, + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + 
"createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "context": null, + "suspended": false + }, + "version": "2023-07-03T18:51:02.970Z" + } + ] +} + ``` +
+ +### Get audit history for a specific supervisor + +Retrieves an audit history of specs for a single supervisor. + +#### URL + +`GET` `/druid/indexer/v1/supervisor/{supervisorId}/history` + +#### Query parameters + +* `count` (optional) + * Type: Integer + * Limit the number of results to the last `n` entries. Must be greater than 0 if specified. + +#### Responses + + + + + + +*Successfully retrieved supervisor audit history* + + + + + +*Invalid supervisor ID* + + + + +--- + +#### Sample request + +The following examples show how to retrieve the audit history of a supervisor with the name `wikipedia_stream`. + +**Get all history entries:** + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/wikipedia_stream/history" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor/wikipedia_stream/history HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +**Get last 10 history entries:** + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/wikipedia_stream/history?count=10" +``` + + + + + +```HTTP +GET /druid/indexer/v1/supervisor/wikipedia_stream/history?count=10 HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json +[ + { + "spec": { + "type": "kafka", + "spec": { + "dataSchema": { + "dataSource": "wikipedia_stream", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9042" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + } + }, + "dataSchema": { + "dataSource": "wikipedia_stream", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true 
+ }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9042" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "context": null, + "suspended": false + }, + "version": "2023-07-05T20:59:16.872Z" + } +] + ``` +
+ +## Manage supervisors + +### Create or update a supervisor + +Creates a new supervisor spec or updates an existing one with new configuration and schema information. When updating a supervisor spec, the datasource must remain the same as the previous supervisor. + +You can define a supervisor spec for [Apache Kafka](../ingestion/kafka-ingestion.md) or [Amazon Kinesis](../ingestion/kinesis-ingestion.md) streaming ingestion methods. + +The following table lists the properties of a supervisor spec: + +|Property|Type|Description|Required| +|--------|----|-----------|--------| +|`type`|String|The supervisor type. One of`kafka` or `kinesis`.|Yes| +|`spec`|Object|The container object for the supervisor configuration.|Yes| +|`ioConfig`|Object|The I/O configuration object to define the connection and I/O-related settings for the supervisor and indexing task.|Yes| +|`dataSchema`|Object|The schema for the indexing task to use during ingestion. See [`dataSchema`](../ingestion/ingestion-spec.md#dataschema) for more information.|Yes| +|`tuningConfig`|Object|The tuning configuration object to define performance-related settings for the supervisor and indexing tasks.|No| + +When you call this endpoint on an existing supervisor, the running supervisor signals its tasks to stop reading and begin publishing, exiting itself. Druid then uses the provided configuration from the request body to create a new supervisor. Druid submits a new schema while retaining existing publishing tasks and starts new tasks at the previous task offsets. +This way, you can apply configuration changes without a pause in ingestion. + +#### URL + +`POST` `/druid/indexer/v1/supervisor` + +#### Responses + + + + + + +*Successfully created a new supervisor or updated an existing supervisor* + + + + + +*Request body content type is not in JSON format* + + + + +--- + +#### Sample request + +The following example uses JSON input format to create a supervisor spec for Kafka with a `social_media` datasource and `social_media` topic. 
+ + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor" \ +--header 'Content-Type: application/json' \ +--data '{ + "type": "kafka", + "spec": { + "ioConfig": { + "type": "kafka", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "useEarliestOffset": true + }, + "tuningConfig": { + "type": "kafka" + }, + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso" + }, + "dimensionsSpec": { + "dimensions": [ + "username", + "post_title", + { + "type": "long", + "name": "views" + }, + { + "type": "long", + "name": "upvotes" + }, + { + "type": "long", + "name": "comments" + }, + "edited" + ] + }, + "granularitySpec": { + "queryGranularity": "none", + "rollup": false, + "segmentGranularity": "hour" + } + } + } +}' +``` + + + + + +```HTTP +POST /druid/indexer/v1/supervisor HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +Content-Type: application/json +Content-Length: 1359 + +{ + "type": "kafka", + "spec": { + "ioConfig": { + "type": "kafka", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "useEarliestOffset": true + }, + "tuningConfig": { + "type": "kafka" + }, + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso" + }, + "dimensionsSpec": { + "dimensions": [ + "username", + "post_title", + { + "type": "long", + "name": "views" + }, + { + "type": "long", + "name": "upvotes" + }, + { + "type": "long", + "name": "comments" + }, + "edited" + ] + }, + "granularitySpec": { + "queryGranularity": "none", + "rollup": false, + "segmentGranularity": "hour" + } + } + } +} +``` + + + + +#### Sample request with `skipRestartIfUnmodified` + +The following example sets the `skipRestartIfUnmodified` flag to true. With this flag set to true, the Supervisor will only restart if there has been a modification to the SupervisorSpec. If left unset, the flag defaults to false. +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor?skipRestartIfUnmodified=true" \ +--header 'Content-Type: application/json' \ +--data '{ + "type": "kafka", + "spec": { + "ioConfig": { + "type": "kafka", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "useEarliestOffset": true + }, + "tuningConfig": { + "type": "kafka" + }, + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso" + }, + "dimensionsSpec": { + "dimensions": [ + "username", + "post_title", + { + "type": "long", + "name": "views" + }, + { + "type": "long", + "name": "upvotes" + }, + { + "type": "long", + "name": "comments" + }, + "edited" + ] + }, + "granularitySpec": { + "queryGranularity": "none", + "rollup": false, + "segmentGranularity": "hour" + } + } + } +}' +``` + +#### Sample response + +
+ View the response + + ```json +{ + "id": "social_media" +} + ``` +
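+
+A common workflow is to keep the supervisor spec in a file under version control, submit it, and then confirm that the supervisor is running. The following sketch assumes a local file named `social-media-supervisor.json` containing the spec above (the file name is illustrative) and that the `jq` JSON processor is installed:
+
+```shell
+# Submit the spec from a local file. The file name is an assumption; use your own.
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor" \
+  --header 'Content-Type: application/json' \
+  --data @social-media-supervisor.json
+
+# Confirm the supervisor is up by checking its detailed state. Assumes jq is installed.
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/status" \
+  | jq '.payload.detailedState'
+```
+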
+ +### Suspend a running supervisor + +Suspends a single running supervisor. Returns the updated supervisor spec, where the `suspended` property is set to `true`. The suspended supervisor continues to emit logs and metrics. +Indexing tasks remain suspended until you [resume the supervisor](#resume-a-supervisor). + +#### URL + +`POST` `/druid/indexer/v1/supervisor/{supervisorId}/suspend` + +#### Responses + + + + + + +*Successfully shut down supervisor* + + + + + +*Supervisor already suspended* + + + + + +*Invalid supervisor ID* + + + + +--- + +#### Sample request + +The following example shows how to suspend a running supervisor with the name `social_media`. + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/suspend" +``` + + + + + +```HTTP +POST /druid/indexer/v1/supervisor/social_media/suspend HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json +{ + "type": "kafka", + "spec": { + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + } + }, + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": 
"string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "context": null, + "suspended": true +} + ``` +
+ +### Suspend all supervisors + +Suspends all supervisors. Note that this endpoint returns an HTTP `200 Success` code message even if there are no supervisors or running supervisors to suspend. + +#### URL + +`POST` `/druid/indexer/v1/supervisor/suspendAll` + +#### Responses + + + + + + +*Successfully suspended all supervisors* + + + + +--- + +#### Sample request + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/suspendAll" +``` + + + + + +```HTTP +POST /druid/indexer/v1/supervisor/suspendAll HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json +{ + "status": "success" +} + ``` +
+ +### Resume a supervisor + +Resumes indexing tasks for a supervisor. Returns an updated supervisor spec with the `suspended` property set to `false`. + +#### URL + +`POST` `/druid/indexer/v1/supervisor/{supervisorId}/resume` + +#### Responses + + + + + + +*Successfully resumed supervisor* + + + + + +*Supervisor already running* + + + + + +*Invalid supervisor ID* + + + + +--- + +#### Sample request + +The following example resumes a previously suspended supervisor with name `social_media`. + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/resume" +``` + + + + + +```HTTP +POST /druid/indexer/v1/supervisor/social_media/resume HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json +{ + "type": "kafka", + "spec": { + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + } + }, + "dataSchema": { + "dataSource": "social_media", + "timestampSpec": { + "column": "__time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "username", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": 
"string", + "name": "post_title", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "long", + "name": "views", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "upvotes", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "long", + "name": "comments", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": false + }, + { + "type": "string", + "name": "edited", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "HOUR", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "tuningConfig": { + "type": "kafka", + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 150000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxRowsPerSegment": 5000000, + "maxTotalRows": null, + "intermediatePersistPeriod": "PT10M", + "maxPendingPersists": 0, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "reportParseExceptions": false, + "handoffConditionTimeout": 0, + "resetOffsetAutomatically": false, + "segmentWriteOutMediumFactory": null, + "workerThreads": null, + "chatRetries": 8, + "httpTimeout": "PT10S", + "shutdownTimeout": "PT80S", + "offsetFetchPeriod": "PT30S", + "intermediateHandoffPeriod": "P2147483647D", + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "skipSequenceNumberAvailabilityCheck": false, + "repartitionTransitionDuration": "PT120S" + }, + "ioConfig": { + "topic": "social_media", + "inputFormat": { + "type": "json" + }, + "replicas": 1, + "taskCount": 1, + "taskDuration": "PT3600S", + "consumerProperties": { + "bootstrap.servers": "localhost:9094" + }, + "autoScalerConfig": null, + "pollTimeout": 100, + "startDelay": "PT5S", + "period": "PT30S", + "useEarliestOffset": true, + "completionTimeout": "PT1800S", + "lateMessageRejectionPeriod": null, + "earlyMessageRejectionPeriod": null, + "lateMessageRejectionStartDateTime": null, + "configOverrides": null, + "idleConfig": null, + "stream": "social_media", + "useEarliestSequenceNumber": true + }, + "context": null, + "suspended": false +} + ``` +
+
+### Resume all supervisors
+
+Resumes all supervisors. Note that this endpoint returns an HTTP `200 OK` response code even if there are no supervisors or suspended supervisors to resume.
+
+#### URL
+
+`POST` `/druid/indexer/v1/supervisor/resumeAll`
+
+#### Responses
+
+
+
+
+
+
+*Successfully resumed all supervisors*
+
+
+
+
+---
+
+#### Sample request
+
+
+
+
+
+
+```shell
+curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/resumeAll"
+```
+
+
+
+
+
+```HTTP
+POST /druid/indexer/v1/supervisor/resumeAll HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json +{ + "status": "success" +} + ``` +
+ +### Reset a supervisor + +The supervisor must be running for this endpoint to be available. + +Resets the specified supervisor. This endpoint clears supervisor metadata, prompting the supervisor to resume data reading. The supervisor restarts from the earliest or latest available position, depending on the value of the `useEarliestOffset` property. +After clearing all stored offsets, the supervisor kills and recreates active tasks, +so that tasks begin reading from valid positions. + +Use this endpoint to recover from a stopped state due to missing offsets. Use this endpoint with caution as it may result in skipped messages and lead to data loss or duplicate data. + +The indexing service keeps track of the latest persisted offsets to provide exactly-once ingestion guarantees across tasks. Subsequent tasks must start reading from where the previous task completed for Druid to accept the generated segments. If the messages at the expected starting offsets are no longer available, the supervisor refuses to start and in-flight tasks fail. Possible causes for missing messages include the message retention period elapsing or the topic being removed and re-created. Use the `reset` endpoint to recover from this condition. + +#### URL + +`POST` `/druid/indexer/v1/supervisor/{supervisorId}/reset` + +#### Responses + + + + + + +*Successfully reset supervisor* + + + + + +*Invalid supervisor ID* + + + + +--- + +#### Sample request + +The following example shows how to reset a supervisor with the name `social_media`. + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/reset" +``` + + + + + +```HTTP +POST /druid/indexer/v1/supervisor/social_media/reset HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json +{ + "id": "social_media" +} + ``` +
+
+### Reset offsets for a supervisor
+
+The supervisor must be running for this endpoint to be available.
+
+Resets the specified offsets for partitions without resetting the entire set.
+
+This endpoint clears only the stored offsets, prompting the supervisor to resume reading data from the specified offsets.
+If there are no stored offsets, the specified offsets are set in the metadata store.
+
+After resetting stored offsets, the supervisor kills and recreates any active tasks pertaining to the specified partitions,
+so that tasks begin reading from the specified offsets. For partitions that are not specified in this operation, the supervisor resumes from the last stored offset.
+
+Use this endpoint with caution. It can cause skipped messages, leading to data loss or duplicate data.
+
+#### URL
+
+`POST` `/druid/indexer/v1/supervisor/{supervisorId}/resetOffsets`
+
+#### Responses
+
+
+
+
+
+
+*Successfully reset offsets*
+
+
+
+
+
+*Invalid supervisor ID*
+
+
+
+
+---
+
+#### Reset offsets metadata
+
+This section presents the structure and details of the reset offsets metadata payload.
+
+| Field | Type | Description | Required |
+|---------|---------|---------|---------|
+| `type` | String | The type of reset offsets metadata payload. It must match the supervisor's `type`. Possible values: `kafka` or `kinesis`. | Yes |
+| `partitions` | Object | An object representing the reset metadata. See below for details. | Yes |
+
+#### Partitions
+
+The following table defines the fields within the `partitions` object in the reset offsets metadata payload.
+
+| Field | Type | Description | Required |
+|---------|---------|---------|---------|
+| `type` | String | Must be set to `end`. Indicates the end sequence numbers for the reset offsets. | Yes |
+| `stream` | String | The stream to be reset. It must be a valid stream consumed by the supervisor. | Yes |
+| `partitionOffsetMap` | Object | A map of partitions to corresponding offsets for the stream to be reset. | Yes |
+
+#### Sample request
+
+The following example shows how to reset offsets for a Kafka supervisor named `social_media`. In this example, the supervisor reads from the Kafka topic `ads_media_stream` and has the stored offsets `{"0": 0, "1": 10, "2": 20, "3": 40}`.
+
+
+
+
+
+
+```shell
+curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/resetOffsets" \
+--header 'Content-Type: application/json' \
+--data-raw '{"type":"kafka","partitions":{"type":"end","stream":"ads_media_stream","partitionOffsetMap":{"0":100, "2": 650}}}'
+```
+
+
+
+
+
+```HTTP
+POST /druid/indexer/v1/supervisor/social_media/resetOffsets HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+Content-Type: application/json
+
+{
+  "type": "kafka",
+  "partitions": {
+    "type": "end",
+    "stream": "ads_media_stream",
+    "partitionOffsetMap": {
+      "0": 100,
+      "2": 650
+    }
+  }
+}
+```
+
+The example operation resets offsets only for partitions `0` and `2`, to 100 and 650 respectively. After a successful reset,
+when the supervisor's tasks restart, they resume reading from `{"0": 100, "1": 10, "2": 650, "3": 40}`.
+
+
+
+
+#### Sample response
+
+ View the response + + ```json +{ + "id": "social_media" +} + ``` +
+ +### Terminate a supervisor + +Terminates a supervisor and its associated indexing tasks, triggering the publishing of their segments. When you terminate a supervisor, Druid places a tombstone marker in the metadata store to prevent reloading on restart. + +The terminated supervisor still exists in the metadata store and its history can be retrieved. + +#### URL + +`POST` `/druid/indexer/v1/supervisor/{supervisorId}/terminate` + +#### Responses + + + + + + +*Successfully terminated a supervisor* + + + + + +*Invalid supervisor ID or supervisor not running* + + + + +--- + +#### Sample request + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/terminate" +``` + + + + + +```HTTP +POST /druid/indexer/v1/supervisor/social_media/terminate HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json +{ + "id": "social_media" +} + ``` +
+
+### Terminate all supervisors
+
+Terminates all supervisors. Terminated supervisors still exist in the metadata store and their history can be retrieved. Note that this endpoint returns an HTTP `200 OK` response code even if there are no supervisors or running supervisors to terminate.
+
+#### URL
+
+`POST` `/druid/indexer/v1/supervisor/terminateAll`
+
+#### Responses
+
+
+
+
+
+
+*Successfully terminated all supervisors*
+
+
+
+
+---
+
+#### Sample request
+
+
+
+
+
+
+```shell
+curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/terminateAll"
+```
+
+
+
+
+
+```HTTP
+POST /druid/indexer/v1/supervisor/terminateAll HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json +{ + "status": "success" +} + ``` +
+
+### Handoff task groups for a supervisor early
+
+Triggers early handoff for the specified task groups of a supervisor. This is a best-effort API and makes no guarantees that handoff actually occurs.
+
+#### URL
+
+`POST` `/druid/indexer/v1/supervisor/{supervisorId}/taskGroups/handoff`
+
+#### Sample request
+
+The following example shows how to hand off task groups `1`, `2`, and `3` early for a supervisor named `social_media`.
+
+
+
+
+
+
+```shell
+curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/supervisor/social_media/taskGroups/handoff" \
+--header 'Content-Type: application/json' \
+--data-raw '{"taskGroupIds": [1, 2, 3]}'
+```
+
+
+
+
+
+```HTTP
+POST /druid/indexer/v1/supervisor/social_media/taskGroups/handoff HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+Content-Type: application/json
+
+{
+  "taskGroupIds": [1, 2, 3]
+}
+```
+
+
+
+
+#### Sample response
+
+ View the response +(empty response) +
+ +### Shut down a supervisor + +Shuts down a supervisor. This endpoint is deprecated and will be removed in future releases. Use the equivalent [terminate](#terminate-a-supervisor) endpoint instead. + +#### URL + +`POST` `/druid/indexer/v1/supervisor/{supervisorId}/shutdown` diff --git a/docs/35.0.0/api-reference/tasks-api.md b/docs/35.0.0/api-reference/tasks-api.md new file mode 100644 index 0000000000..f53037f84e --- /dev/null +++ b/docs/35.0.0/api-reference/tasks-api.md @@ -0,0 +1,1663 @@ +--- +id: tasks-api +title: Tasks API +sidebar_label: Tasks +--- +import Tabs from '@theme/Tabs'; +import TabItem from '@theme/TabItem'; + + + + +This document describes the API endpoints for task retrieval, submission, and deletion for Apache Druid. Tasks are individual jobs performed by Druid to complete operations such as ingestion, querying, and compaction. + +In this topic, `http://ROUTER_IP:ROUTER_PORT` is a placeholder for the Router service address and port. For example, on the quickstart configuration, use `http://localhost:8888`. + +## Task information and retrieval + +### Get an array of tasks + +Retrieves an array of all tasks in the Druid cluster. Each task object includes information on its ID, status, associated datasource, and other metadata. For definitions of the response properties, see the [Tasks table](../querying/sql-metadata-tables.md#tasks-table). + +#### URL + +`GET` `/druid/indexer/v1/tasks` + +#### Query parameters + +The endpoint supports a set of optional query parameters to filter results. + +|Parameter|Type|Description| +|---|---|---| +|`state`|String|Filter list of tasks by task state, valid options are `running`, `complete`, `waiting`, and `pending`.| +| `datasource`|String| Return tasks filtered by Druid datasource.| +| `createdTimeInterval`|String (ISO-8601)| Return tasks created within the specified interval. Use `_` as the delimiter for the interval string. Do not use `/`. For example, `2023-06-27_2023-06-28`.| +| `max`|Integer|Maximum number of `complete` tasks to return. Only applies when `state` is set to `complete`.| +| `type`|String|Filter tasks by task type. See [task documentation](../ingestion/tasks.md) for more details.| + +#### Responses + + + + + + +
+ +*Successfully retrieved list of tasks* + +
+ + + +
+ +*Invalid `state` query parameter value* + +
+ + + +
+ +*Invalid query parameter* + +
+
+ +--- + +#### Sample request + +The following example shows how to retrieve a list of tasks filtered with the following query parameters: +* State: `complete` +* Datasource: `wikipedia_api` +* Time interval: between `2015-09-12` and `2015-09-13` +* Max entries returned: `10` +* Task type: `query_worker` + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/tasks/?state=complete&datasource=wikipedia_api&createdTimeInterval=2015-09-12_2015-09-13&max=10&type=query_worker" +``` + + + + + +```HTTP +GET /druid/indexer/v1/tasks/?state=complete&datasource=wikipedia_api&createdTimeInterval=2015-09-12_2015-09-13&max=10&type=query_worker HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + [ + { + "id": "query-223549f8-b993-4483-b028-1b0d54713cad-worker0_0", + "groupId": "query-223549f8-b993-4483-b028-1b0d54713cad", + "type": "query_worker", + "createdTime": "2023-06-22T22:11:37.012Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "SUCCESS", + "status": "SUCCESS", + "runnerStatusCode": "NONE", + "duration": 17897, + "location": { + "host": "localhost", + "port": 8101, + "tlsPort": -1 + }, + "dataSource": "wikipedia_api", + "errorMsg": null + }, + { + "id": "query-fa82fa40-4c8c-4777-b832-cabbee5f519f-worker0_0", + "groupId": "query-fa82fa40-4c8c-4777-b832-cabbee5f519f", + "type": "query_worker", + "createdTime": "2023-06-20T22:51:21.302Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "SUCCESS", + "status": "SUCCESS", + "runnerStatusCode": "NONE", + "duration": 16911, + "location": { + "host": "localhost", + "port": 8101, + "tlsPort": -1 + }, + "dataSource": "wikipedia_api", + "errorMsg": null + }, + { + "id": "query-5419da7a-b270-492f-90e6-920ecfba766a-worker0_0", + "groupId": "query-5419da7a-b270-492f-90e6-920ecfba766a", + "type": "query_worker", + "createdTime": "2023-06-20T22:45:53.909Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "SUCCESS", + "status": "SUCCESS", + "runnerStatusCode": "NONE", + "duration": 17030, + "location": { + "host": "localhost", + "port": 8101, + "tlsPort": -1 + }, + "dataSource": "wikipedia_api", + "errorMsg": null + } + ] + ``` + +
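+When scripting against this endpoint, it is often convenient to reduce the response to just the task IDs. The following sketch is one way to do that with `jq`, a separate command-line JSON processor that is not part of Druid; the state and datasource values are only examples.
+
+```shell
+# List the IDs of running tasks for one datasource (assumes jq is installed).
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/tasks?state=running&datasource=wikipedia_api" \
+  | jq -r '.[].id'
+```
+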
+ +### Get an array of complete tasks + +Retrieves an array of completed tasks in the Druid cluster. This is functionally equivalent to `/druid/indexer/v1/tasks?state=complete`. For definitions of the response properties, see the [Tasks table](../querying/sql-metadata-tables.md#tasks-table). + +#### URL + +`GET` `/druid/indexer/v1/completeTasks` + +#### Query parameters + +The endpoint supports a set of optional query parameters to filter results. + +|Parameter|Type|Description| +|---|---|---| +| `datasource`|String| Return tasks filtered by Druid datasource.| +| `createdTimeInterval`|String (ISO-8601)| Return tasks created within the specified interval. The interval string should be delimited by `_` instead of `/`. For example, `2023-06-27_2023-06-28`.| +| `max`|Integer|Maximum number of `complete` tasks to return. Only applies when `state` is set to `complete`.| +| `type`|String|Filter tasks by task type. See [task documentation](../ingestion/tasks.md) for more details.| + +#### Responses + + + + + + +
+ +*Successfully retrieved list of complete tasks* + +
+ + + +
+ +*Request sent to incorrect service* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/completeTasks" +``` + + + + + +```HTTP +GET /druid/indexer/v1/completeTasks HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + [ + { + "id": "query-223549f8-b993-4483-b028-1b0d54713cad-worker0_0", + "groupId": "query-223549f8-b993-4483-b028-1b0d54713cad", + "type": "query_worker", + "createdTime": "2023-06-22T22:11:37.012Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "SUCCESS", + "status": "SUCCESS", + "runnerStatusCode": "NONE", + "duration": 17897, + "location": { + "host": "localhost", + "port": 8101, + "tlsPort": -1 + }, + "dataSource": "wikipedia_api", + "errorMsg": null + }, + { + "id": "query-223549f8-b993-4483-b028-1b0d54713cad", + "groupId": "query-223549f8-b993-4483-b028-1b0d54713cad", + "type": "query_controller", + "createdTime": "2023-06-22T22:11:28.367Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "SUCCESS", + "status": "SUCCESS", + "runnerStatusCode": "NONE", + "duration": 30317, + "location": { + "host": "localhost", + "port": 8100, + "tlsPort": -1 + }, + "dataSource": "wikipedia_api", + "errorMsg": null + } + ] + ``` + +
+ +### Get an array of running tasks + +Retrieves an array of running task objects in the Druid cluster. It is functionally equivalent to `/druid/indexer/v1/tasks?state=running`. For definitions of the response properties, see the [Tasks table](../querying/sql-metadata-tables.md#tasks-table). + +#### URL + +`GET` `/druid/indexer/v1/runningTasks` + +#### Query parameters + +The endpoint supports a set of optional query parameters to filter results. + +|Parameter|Type|Description| +|---|---|---| +| `datasource`|String| Return tasks filtered by Druid datasource.| +| `createdTimeInterval`|String (ISO-8601)| Return tasks created within the specified interval. The interval string should be delimited by `_` instead of `/`. For example, `2023-06-27_2023-06-28`.| +| `max`|Integer|Maximum number of `complete` tasks to return. Only applies when `state` is set to `complete`.| +| `type`|String|Filter tasks by task type. See [task documentation](../ingestion/tasks.md) for more details.| + +#### Responses + + + + + + +
+ +*Successfully retrieved list of running tasks* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/runningTasks" +``` + + + + + +```HTTP +GET /druid/indexer/v1/runningTasks HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + + +#### Sample response + +
+ View the response + + ```json + [ + { + "id": "query-32663269-ead9-405a-8eb6-0817a952ef47", + "groupId": "query-32663269-ead9-405a-8eb6-0817a952ef47", + "type": "query_controller", + "createdTime": "2023-06-22T22:54:43.170Z", + "queueInsertionTime": "2023-06-22T22:54:43.170Z", + "statusCode": "RUNNING", + "status": "RUNNING", + "runnerStatusCode": "RUNNING", + "duration": -1, + "location": { + "host": "localhost", + "port": 8100, + "tlsPort": -1 + }, + "dataSource": "wikipedia_api", + "errorMsg": null + } + ] + ``` + +
+ +### Get an array of waiting tasks + +Retrieves an array of waiting tasks in the Druid cluster. It is functionally equivalent to `/druid/indexer/v1/tasks?state=waiting`. For definitions of the response properties, see the [Tasks table](../querying/sql-metadata-tables.md#tasks-table). + +#### URL + +`GET` `/druid/indexer/v1/waitingTasks` + +#### Query parameters + +The endpoint supports a set of optional query parameters to filter results. + +|Parameter|Type|Description| +|---|---|---| +| `datasource`|String| Return tasks filtered by Druid datasource.| +| `createdTimeInterval`|String (ISO-8601)| Return tasks created within the specified interval. The interval string should be delimited by `_` instead of `/`. For example, `2023-06-27_2023-06-28`.| +| `max`|Integer|Maximum number of `complete` tasks to return. Only applies when `state` is set to `complete`.| +| `type`|String|Filter tasks by task type. See [task documentation](../ingestion/tasks.md) for more details.| + +#### Responses + + + + + + +
+ +*Successfully retrieved list of waiting tasks* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/waitingTasks" +``` + + + + + +```HTTP +GET /druid/indexer/v1/waitingTasks HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + [ + { + "id": "index_parallel_wikipedia_auto_biahcbmf_2023-06-26T21:08:05.216Z", + "groupId": "index_parallel_wikipedia_auto_biahcbmf_2023-06-26T21:08:05.216Z", + "type": "index_parallel", + "createdTime": "2023-06-26T21:08:05.217Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "RUNNING", + "status": "RUNNING", + "runnerStatusCode": "WAITING", + "duration": -1, + "location": { + "host": null, + "port": -1, + "tlsPort": -1 + }, + "dataSource": "wikipedia_auto", + "errorMsg": null + }, + { + "id": "index_parallel_wikipedia_auto_afggfiec_2023-06-26T21:08:05.546Z", + "groupId": "index_parallel_wikipedia_auto_afggfiec_2023-06-26T21:08:05.546Z", + "type": "index_parallel", + "createdTime": "2023-06-26T21:08:05.548Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "RUNNING", + "status": "RUNNING", + "runnerStatusCode": "WAITING", + "duration": -1, + "location": { + "host": null, + "port": -1, + "tlsPort": -1 + }, + "dataSource": "wikipedia_auto", + "errorMsg": null + }, + { + "id": "index_parallel_wikipedia_auto_jmmddihf_2023-06-26T21:08:06.644Z", + "groupId": "index_parallel_wikipedia_auto_jmmddihf_2023-06-26T21:08:06.644Z", + "type": "index_parallel", + "createdTime": "2023-06-26T21:08:06.671Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "RUNNING", + "status": "RUNNING", + "runnerStatusCode": "WAITING", + "duration": -1, + "location": { + "host": null, + "port": -1, + "tlsPort": -1 + }, + "dataSource": "wikipedia_auto", + "errorMsg": null + } + ] + ``` + +
+ +### Get an array of pending tasks + +Retrieves an array of pending tasks in the Druid cluster. It is functionally equivalent to `/druid/indexer/v1/tasks?state=pending`. For definitions of the response properties, see the [Tasks table](../querying/sql-metadata-tables.md#tasks-table). + +#### URL + +`GET` `/druid/indexer/v1/pendingTasks` + +#### Query parameters + +The endpoint supports a set of optional query parameters to filter results. + +|Parameter|Type|Description| +|---|---|---| +| `datasource`|String| Return tasks filtered by Druid datasource.| +| `createdTimeInterval`|String (ISO-8601)| Return tasks created within the specified interval. The interval string should be delimited by `_` instead of `/`. For example, `2023-06-27_2023-06-28`.| +| `max`|Integer|Maximum number of `complete` tasks to return. Only applies when `state` is set to `complete`.| +| `type`|String|Filter tasks by task type. See [task documentation](../ingestion/tasks.md) for more details.| + +#### Responses + + + + + + +
+ +*Successfully retrieved list of pending tasks* + +
+
+ +--- + +#### Sample request + + + + + + +```shell +curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/pendingTasks" +``` + + + + + +```HTTP +GET /druid/indexer/v1/pendingTasks HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + [ + { + "id": "query-7b37c315-50a0-4b68-aaa8-b1ef1f060e67", + "groupId": "query-7b37c315-50a0-4b68-aaa8-b1ef1f060e67", + "type": "query_controller", + "createdTime": "2023-06-23T19:53:06.037Z", + "queueInsertionTime": "2023-06-23T19:53:06.037Z", + "statusCode": "RUNNING", + "status": "RUNNING", + "runnerStatusCode": "PENDING", + "duration": -1, + "location": { + "host": null, + "port": -1, + "tlsPort": -1 + }, + "dataSource": "wikipedia_api", + "errorMsg": null + }, + { + "id": "query-544f0c41-f81d-4504-b98b-f9ab8b36ef36", + "groupId": "query-544f0c41-f81d-4504-b98b-f9ab8b36ef36", + "type": "query_controller", + "createdTime": "2023-06-23T19:53:06.616Z", + "queueInsertionTime": "2023-06-23T19:53:06.616Z", + "statusCode": "RUNNING", + "status": "RUNNING", + "runnerStatusCode": "PENDING", + "duration": -1, + "location": { + "host": null, + "port": -1, + "tlsPort": -1 + }, + "dataSource": "wikipedia_api", + "errorMsg": null + } + ] + ``` + +
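+A pending list that stays non-empty usually means the cluster has run out of task slots. As a quick check, you can count the pending tasks with `jq` (assumed to be installed); this is only a sketch.
+
+```shell
+# Count how many tasks are currently waiting for a worker slot.
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/pendingTasks" | jq 'length'
+```
+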
+ +### Get task payload + +Retrieves the payload of a task given the task ID. It returns a JSON object with the task ID and payload that includes task configuration details and relevant specifications associated with the execution of the task. + +#### URL + +`GET` `/druid/indexer/v1/task/{taskId}` + +#### Responses + + + + + + +
+ +*Successfully retrieved payload of task* + +
+ + + +
+ +*Cannot find task with ID* + +
+
+
+---
+
+#### Sample request
+
+The following example shows how to retrieve the payload of the task with the specified ID `index_parallel_wikipedia_short_iajoonnd_2023-07-07T17:53:12.174Z`.
+
+
+
+
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/index_parallel_wikipedia_short_iajoonnd_2023-07-07T17:53:12.174Z"
+```
+
+
+
+
+
+```HTTP
+GET /druid/indexer/v1/task/index_parallel_wikipedia_short_iajoonnd_2023-07-07T17:53:12.174Z HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "task": "index_parallel_wikipedia_short_iajoonnd_2023-07-07T17:53:12.174Z", + "payload": { + "type": "index_parallel", + "id": "index_parallel_wikipedia_short_iajoonnd_2023-07-07T17:53:12.174Z", + "groupId": "index_parallel_wikipedia_short_iajoonnd_2023-07-07T17:53:12.174Z", + "resource": { + "availabilityGroup": "index_parallel_wikipedia_short_iajoonnd_2023-07-07T17:53:12.174Z", + "requiredCapacity": 1 + }, + "spec": { + "dataSchema": { + "dataSource": "wikipedia_short", + "timestampSpec": { + "column": "time", + "format": "iso", + "missingValue": null + }, + "dimensionsSpec": { + "dimensions": [ + { + "type": "string", + "name": "cityName", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "countryName", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + }, + { + "type": "string", + "name": "regionName", + "multiValueHandling": "SORTED_ARRAY", + "createBitmapIndex": true + } + ], + "dimensionExclusions": [ + "__time", + "time" + ], + "includeAllDimensions": false, + "useSchemaDiscovery": false + }, + "metricsSpec": [], + "granularitySpec": { + "type": "uniform", + "segmentGranularity": "DAY", + "queryGranularity": { + "type": "none" + }, + "rollup": false, + "intervals": [ + "2015-09-12T00:00:00.000Z/2015-09-13T00:00:00.000Z" + ] + }, + "transformSpec": { + "filter": null, + "transforms": [] + } + }, + "ioConfig": { + "type": "index_parallel", + "inputSource": { + "type": "local", + "baseDir": "quickstart/tutorial", + "filter": "wikiticker-2015-09-12-sampled.json.gz" + }, + "inputFormat": { + "type": "json" + }, + "appendToExisting": false, + "dropExisting": false + }, + "tuningConfig": { + "type": "index_parallel", + "maxRowsPerSegment": 5000000, + "appendableIndexSpec": { + "type": "onheap", + "preserveExistingMetrics": false + }, + "maxRowsInMemory": 25000, + "maxBytesInMemory": 0, + "skipBytesInMemoryOverheadCheck": false, + "maxTotalRows": null, + "numShards": null, + "splitHintSpec": null, + "partitionsSpec": { + "type": "dynamic", + "maxRowsPerSegment": 5000000, + "maxTotalRows": null + }, + "indexSpec": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "indexSpecForIntermediatePersists": { + "bitmap": { + "type": "roaring" + }, + "dimensionCompression": "lz4", + "stringDictionaryEncoding": { + "type": "utf8" + }, + "metricCompression": "lz4", + "longEncoding": "longs" + }, + "maxPendingPersists": 0, + "forceGuaranteedRollup": false, + "reportParseExceptions": false, + "pushTimeout": 0, + "segmentWriteOutMediumFactory": null, + "maxNumConcurrentSubTasks": 1, + "maxRetry": 3, + "taskStatusCheckPeriodMs": 1000, + "chatHandlerTimeout": "PT10S", + "chatHandlerNumRetries": 5, + "maxNumSegmentsToMerge": 100, + "totalNumMergeTasks": 10, + "logParseExceptions": false, + "maxParseExceptions": 2147483647, + "maxSavedParseExceptions": 0, + "maxColumnsToMerge": -1, + "awaitSegmentAvailabilityTimeoutMillis": 0, + "maxAllowedLockCount": -1, + "partitionDimensions": [] + } + }, + "context": { + "forceTimeChunkLock": true, + "useLineageBasedSegmentAllocation": true + }, + "dataSource": "wikipedia_short" + } +} + ``` + +
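+Because the payload embeds the full ingestion spec, this endpoint is a convenient way to inspect how a task was configured. The following sketch, which assumes `jq` is installed, extracts only the `ioConfig` from the payload shown above.
+
+```shell
+# Inspect the input source and input format that a task was submitted with.
+TASK_ID="index_parallel_wikipedia_short_iajoonnd_2023-07-07T17:53:12.174Z"
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/${TASK_ID}" | jq '.payload.spec.ioConfig'
+```
+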
+ +### Get task status + +Retrieves the status of a task given the task ID. It returns a JSON object with the task's status code, runner status, task type, datasource, and other relevant metadata. + +#### URL + +`GET` `/druid/indexer/v1/task/{taskId}/status` + +#### Responses + + + + + + +
+ +*Successfully retrieved task status* + +
+ + + +
+ +*Cannot find task with ID* + +
+
+
+---
+
+#### Sample request
+
+The following example shows how to retrieve the status of the task with the specified ID `query-223549f8-b993-4483-b028-1b0d54713cad`.
+
+
+
+
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-223549f8-b993-4483-b028-1b0d54713cad/status"
+```
+
+
+
+
+
+```HTTP
+GET /druid/indexer/v1/task/query-223549f8-b993-4483-b028-1b0d54713cad/status HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "task": "query-223549f8-b993-4483-b028-1b0d54713cad", + "status": { + "id": "query-223549f8-b993-4483-b028-1b0d54713cad", + "groupId": "query-223549f8-b993-4483-b028-1b0d54713cad", + "type": "query_controller", + "createdTime": "2023-06-22T22:11:28.367Z", + "queueInsertionTime": "1970-01-01T00:00:00.000Z", + "statusCode": "RUNNING", + "status": "RUNNING", + "runnerStatusCode": "RUNNING", + "duration": -1, + "location": {"host": "localhost", "port": 8100, "tlsPort": -1}, + "dataSource": "wikipedia_api", + "errorMsg": null + } + } + ``` + +
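+The `statusCode` field changes to a terminal value such as `SUCCESS` or `FAILED` once the task finishes, so this endpoint works well for polling. The following sketch, assuming `jq` is installed and a real task ID is substituted, checks every ten seconds until the task leaves the `RUNNING` state.
+
+```shell
+# Poll a task until it reaches a terminal state.
+TASK_ID="query-223549f8-b993-4483-b028-1b0d54713cad"   # replace with your task ID
+while true; do
+  STATUS=$(curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/${TASK_ID}/status" \
+    | jq -r '.status.statusCode')
+  echo "Task ${TASK_ID} is ${STATUS}"
+  [ "${STATUS}" != "RUNNING" ] && break
+  sleep 10
+done
+```
+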
+
+### Get task segments
+
+:::info
+ This API is no longer supported and always returns a 404 response.
+ Use the metric `segment/added/bytes` instead to identify the segment IDs committed by a task.
+:::
+
+#### URL
+
+`GET` `/druid/indexer/v1/task/{taskId}/segments`
+
+#### Responses
+
+
+
+
+
+
+```json
+{
+  "error": "Segment IDs committed by a task action are not persisted anymore. Use the metric 'segment/added/bytes' to identify the segments created by a task."
+}
+```
+
+
+
+
+---
+
+#### Sample request
+
+The following example shows a request for the task segments of the task with the specified ID `query-52a8aafe-7265-4427-89fe-dc51275cc470`.
+
+
+
+
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-52a8aafe-7265-4427-89fe-dc51275cc470/segments"
+```
+
+
+
+
+
+```HTTP
+GET /druid/indexer/v1/task/query-52a8aafe-7265-4427-89fe-dc51275cc470/segments HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+
+#### Sample response
+
+The request returns a `404 Not Found` response with the error message shown above, because this API is no longer supported.
+
+### Get task log
+
+Retrieves the event log associated with a task. It returns a list of logged events during the lifecycle of the task. The endpoint is useful for providing information about the execution of the task, including any errors or warnings raised.
+
+Task logs are automatically retrieved from the Middle Manager/Indexer or from long-term storage. For reference, see [Task logs](../ingestion/tasks.md#task-logs).
+
+#### URL
+
+`GET` `/druid/indexer/v1/task/{taskId}/log`
+
+#### Query parameters
+
+* `offset` (optional)
+  * Type: Int
+  * Excludes the specified number of initial entries from the response.
+
+#### Responses
+
+
+
+
+
+ +*Successfully retrieved task log* + +
+
+
+---
+
+#### Sample request
+
+The following example shows how to retrieve the task log of the task with the specified ID `index_kafka_social_media_0e905aa31037879_nommnaeg`.
+
+
+
+
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/index_kafka_social_media_0e905aa31037879_nommnaeg/log"
+```
+
+
+
+
+
+```HTTP
+GET /druid/indexer/v1/task/index_kafka_social_media_0e905aa31037879_nommnaeg/log HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + 2023-07-03T22:11:17,891 INFO [qtp1251996697-122] org.apache.druid.indexing.seekablestream.SeekableStreamIndexTaskRunner - Sequence[index_kafka_social_media_0e905aa31037879_0] end offsets updated from [{0=9223372036854775807}] to [{0=230985}]. + 2023-07-03T22:11:17,900 INFO [qtp1251996697-122] org.apache.druid.indexing.seekablestream.SeekableStreamIndexTaskRunner - Saved sequence metadata to disk: [SequenceMetadata{sequenceId=0, sequenceName='index_kafka_social_media_0e905aa31037879_0', assignments=[0], startOffsets={0=230985}, exclusiveStartPartitions=[], endOffsets={0=230985}, sentinel=false, checkpointed=true}] + 2023-07-03T22:11:17,901 INFO [task-runner-0-priority-0] org.apache.druid.indexing.seekablestream.SeekableStreamIndexTaskRunner - Received resume command, resuming ingestion. + 2023-07-03T22:11:17,901 INFO [task-runner-0-priority-0] org.apache.druid.indexing.seekablestream.SeekableStreamIndexTaskRunner - Finished reading partition[0], up to[230985]. + 2023-07-03T22:11:17,902 INFO [task-runner-0-priority-0] org.apache.kafka.clients.consumer.internals.ConsumerCoordinator - [Consumer clientId=consumer-kafka-supervisor-dcanhmig-1, groupId=kafka-supervisor-dcanhmig] Resetting generation and member id due to: consumer pro-actively leaving the group + 2023-07-03T22:11:17,902 INFO [task-runner-0-priority-0] org.apache.kafka.clients.consumer.internals.ConsumerCoordinator - [Consumer clientId=consumer-kafka-supervisor-dcanhmig-1, groupId=kafka-supervisor-dcanhmig] Request joining group due to: consumer pro-actively leaving the group + 2023-07-03T22:11:17,902 INFO [task-runner-0-priority-0] org.apache.kafka.clients.consumer.KafkaConsumer - [Consumer clientId=consumer-kafka-supervisor-dcanhmig-1, groupId=kafka-supervisor-dcanhmig] Unsubscribed all topics or patterns and assigned partitions + 2023-07-03T22:11:17,912 INFO [task-runner-0-priority-0] org.apache.druid.segment.realtime.appenderator.StreamAppenderator - Persisted rows[0] and (estimated) bytes[0] + 2023-07-03T22:11:17,916 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-appenderator-persist] org.apache.druid.segment.realtime.appenderator.StreamAppenderator - Flushed in-memory data with commit metadata [AppenderatorDriverMetadata{segments={}, lastSegmentIds={}, callerMetadata={nextPartitions=SeekableStreamEndSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}}}}] for segments: + 2023-07-03T22:11:17,917 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-appenderator-persist] org.apache.druid.segment.realtime.appenderator.StreamAppenderator - Persisted stats: processed rows: [0], persisted rows[0], sinks: [0], total fireHydrants (across sinks): [0], persisted fireHydrants (across sinks): [0] + 2023-07-03T22:11:17,919 INFO [task-runner-0-priority-0] org.apache.druid.segment.realtime.appenderator.BaseAppenderatorDriver - Pushing [0] segments in background + 2023-07-03T22:11:17,921 INFO [task-runner-0-priority-0] org.apache.druid.segment.realtime.appenderator.StreamAppenderator - Persisted rows[0] and (estimated) bytes[0] + 2023-07-03T22:11:17,924 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-appenderator-persist] org.apache.druid.segment.realtime.appenderator.StreamAppenderator - Flushed in-memory data with commit metadata [AppenderatorDriverMetadata{segments={}, lastSegmentIds={}, callerMetadata={nextPartitions=SeekableStreamStartSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}, exclusivePartitions=[]}, 
publishPartitions=SeekableStreamEndSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}}}}] for segments: + 2023-07-03T22:11:17,924 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-appenderator-persist] org.apache.druid.segment.realtime.appenderator.StreamAppenderator - Persisted stats: processed rows: [0], persisted rows[0], sinks: [0], total fireHydrants (across sinks): [0], persisted fireHydrants (across sinks): [0] + 2023-07-03T22:11:17,925 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-appenderator-merge] org.apache.druid.segment.realtime.appenderator.StreamAppenderator - Preparing to push (stats): processed rows: [0], sinks: [0], fireHydrants (across sinks): [0] + 2023-07-03T22:11:17,925 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-appenderator-merge] org.apache.druid.segment.realtime.appenderator.StreamAppenderator - Push complete... + 2023-07-03T22:11:17,929 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-publish] org.apache.druid.indexing.seekablestream.SequenceMetadata - With empty segment set, start offsets [SeekableStreamStartSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}, exclusivePartitions=[]}] and end offsets [SeekableStreamEndSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}}] are the same, skipping metadata commit. + 2023-07-03T22:11:17,930 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-publish] org.apache.druid.segment.realtime.appenderator.BaseAppenderatorDriver - Published [0] segments with commit metadata [{nextPartitions=SeekableStreamStartSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}, exclusivePartitions=[]}, publishPartitions=SeekableStreamEndSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}}}] + 2023-07-03T22:11:17,930 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-publish] org.apache.druid.indexing.seekablestream.SeekableStreamIndexTaskRunner - Published 0 segments for sequence [index_kafka_social_media_0e905aa31037879_0] with metadata [AppenderatorDriverMetadata{segments={}, lastSegmentIds={}, callerMetadata={nextPartitions=SeekableStreamStartSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}, exclusivePartitions=[]}, publishPartitions=SeekableStreamEndSequenceNumbers{stream='social_media', partitionSequenceNumberMap={0=230985}}}}]. 
+ 2023-07-03T22:11:17,931 INFO [[index_kafka_social_media_0e905aa31037879_nommnaeg]-publish] org.apache.druid.indexing.seekablestream.SeekableStreamIndexTaskRunner - Saved sequence metadata to disk: [] + 2023-07-03T22:11:17,932 INFO [task-runner-0-priority-0] org.apache.druid.indexing.seekablestream.SeekableStreamIndexTaskRunner - Handoff complete for segments: + 2023-07-03T22:11:17,932 INFO [task-runner-0-priority-0] org.apache.kafka.clients.consumer.internals.ConsumerCoordinator - [Consumer clientId=consumer-kafka-supervisor-dcanhmig-1, groupId=kafka-supervisor-dcanhmig] Resetting generation and member id due to: consumer pro-actively leaving the group + 2023-07-03T22:11:17,932 INFO [task-runner-0-priority-0] org.apache.kafka.clients.consumer.internals.ConsumerCoordinator - [Consumer clientId=consumer-kafka-supervisor-dcanhmig-1, groupId=kafka-supervisor-dcanhmig] Request joining group due to: consumer pro-actively leaving the group + 2023-07-03T22:11:17,933 INFO [task-runner-0-priority-0] org.apache.kafka.common.metrics.Metrics - Metrics scheduler closed + 2023-07-03T22:11:17,933 INFO [task-runner-0-priority-0] org.apache.kafka.common.metrics.Metrics - Closing reporter org.apache.kafka.common.metrics.JmxReporter + 2023-07-03T22:11:17,933 INFO [task-runner-0-priority-0] org.apache.kafka.common.metrics.Metrics - Metrics reporters closed + 2023-07-03T22:11:17,935 INFO [task-runner-0-priority-0] org.apache.kafka.common.utils.AppInfoParser - App info kafka.consumer for consumer-kafka-supervisor-dcanhmig-1 unregistered + 2023-07-03T22:11:17,936 INFO [task-runner-0-priority-0] org.apache.druid.curator.announcement.PathChildrenAnnouncer - Unannouncing [/druid/internal-discovery/PEON/localhost:8100] + 2023-07-03T22:11:17,972 INFO [task-runner-0-priority-0] org.apache.druid.curator.discovery.CuratorDruidNodeAnnouncer - Unannounced self [{"druidNode":{"service":"druid/middleManager","host":"localhost","bindOnHost":false,"plaintextPort":8100,"port":-1,"tlsPort":-1,"enablePlaintextPort":true,"enableTlsPort":false},"nodeType":"peon","services":{"dataNodeService":{"type":"dataNodeService","tier":"_default_tier","maxSize":0,"type":"indexer-executor","serverType":"indexer-executor","priority":0},"lookupNodeService":{"type":"lookupNodeService","lookupTier":"__default"}}}]. 
+ 2023-07-03T22:11:17,972 INFO [task-runner-0-priority-0] org.apache.druid.curator.announcement.PathChildrenAnnouncer - Unannouncing [/druid/announcements/localhost:8100] + 2023-07-03T22:11:17,996 INFO [task-runner-0-priority-0] org.apache.druid.indexing.worker.executor.ExecutorLifecycle - Task completed with status: { + "id" : "index_kafka_social_media_0e905aa31037879_nommnaeg", + "status" : "SUCCESS", + "duration" : 3601130, + "errorMsg" : null, + "location" : { + "host" : null, + "port" : -1, + "tlsPort" : -1 + } + } + 2023-07-03T22:11:17,998 INFO [main] org.apache.druid.java.util.common.lifecycle.Lifecycle - Stopping lifecycle [module] stage [ANNOUNCEMENTS] + 2023-07-03T22:11:18,005 INFO [main] org.apache.druid.java.util.common.lifecycle.Lifecycle - Stopping lifecycle [module] stage [SERVER] + 2023-07-03T22:11:18,009 INFO [main] org.eclipse.jetty.server.AbstractConnector - Stopped ServerConnector@6491006{HTTP/1.1, (http/1.1)}{0.0.0.0:8100} + 2023-07-03T22:11:18,009 INFO [main] org.eclipse.jetty.server.session - node0 Stopped scavenging + 2023-07-03T22:11:18,012 INFO [main] org.eclipse.jetty.server.handler.ContextHandler - Stopped o.e.j.s.ServletContextHandler@742aa00a{/,null,STOPPED} + 2023-07-03T22:11:18,014 INFO [main] org.apache.druid.java.util.common.lifecycle.Lifecycle - Stopping lifecycle [module] stage [NORMAL] + 2023-07-03T22:11:18,014 INFO [main] org.apache.druid.server.coordination.ZkCoordinator - Stopping ZkCoordinator for [DruidServerMetadata{name='localhost:8100', hostAndPort='localhost:8100', hostAndTlsPort='null', maxSize=0, tier='_default_tier', type=indexer-executor, priority=0}] + 2023-07-03T22:11:18,014 INFO [main] org.apache.druid.server.coordination.SegmentLoadDropHandler - Stopping... + 2023-07-03T22:11:18,014 INFO [main] org.apache.druid.server.coordination.SegmentLoadDropHandler - Stopped. + 2023-07-03T22:11:18,014 INFO [main] org.apache.druid.indexing.overlord.SingleTaskBackgroundRunner - Starting graceful shutdown of task[index_kafka_social_media_0e905aa31037879_nommnaeg]. + 2023-07-03T22:11:18,014 INFO [main] org.apache.druid.indexing.seekablestream.SeekableStreamIndexTaskRunner - Stopping forcefully (status: [PUBLISHING]) + 2023-07-03T22:11:18,019 INFO [LookupExtractorFactoryContainerProvider-MainThread] org.apache.druid.query.lookup.LookupReferencesManager - Lookup Management loop exited. Lookup notices are not handled anymore. + 2023-07-03T22:11:18,020 INFO [main] org.apache.druid.query.lookup.LookupReferencesManager - Closed lookup [name]. + 2023-07-03T22:11:18,020 INFO [Curator-Framework-0] org.apache.curator.framework.imps.CuratorFrameworkImpl - backgroundOperationsLoop exiting + 2023-07-03T22:11:18,147 INFO [main] org.apache.zookeeper.ZooKeeper - Session: 0x1000097ceaf0007 closed + 2023-07-03T22:11:18,147 INFO [main-EventThread] org.apache.zookeeper.ClientCnxn - EventThread shut down for session: 0x1000097ceaf0007 + 2023-07-03T22:11:18,151 INFO [main] org.apache.druid.java.util.common.lifecycle.Lifecycle - Stopping lifecycle [module] stage [INIT] + Finished peon task + ``` + +
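+If you only need recent output from a long-running task rather than the full log, you can pass the `offset` query parameter described above. The following sketch assumes the documented behavior of skipping the first entries of the log; the offset value and task ID are only examples.
+
+```shell
+# Fetch the task log, skipping the first 1000 entries.
+TASK_ID="index_kafka_social_media_0e905aa31037879_nommnaeg"   # replace with your task ID
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/${TASK_ID}/log?offset=1000"
+```
+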
+ +### Get task completion report + +Retrieves a [task completion report](../ingestion/tasks.md#task-reports) for a task. It returns a JSON object with information about the number of rows ingested, and any parse exceptions that Druid raised. + +#### URL + +`GET` `/druid/indexer/v1/task/{taskId}/reports` + +#### Responses + + + + + + +
+ +*Successfully retrieved task report* + +
+
+
+---
+
+#### Sample request
+
+The following example shows how to retrieve the completion report of the task with the specified ID `query-52a8aafe-7265-4427-89fe-dc51275cc470`.
+
+
+
+
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-52a8aafe-7265-4427-89fe-dc51275cc470/reports"
+```
+
+
+
+
+
+```HTTP
+GET /druid/indexer/v1/task/query-52a8aafe-7265-4427-89fe-dc51275cc470/reports HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "ingestionStatsAndErrors": { + "type": "ingestionStatsAndErrors", + "taskId": "query-52a8aafe-7265-4427-89fe-dc51275cc470", + "payload": { + "ingestionState": "COMPLETED", + "unparseableEvents": {}, + "rowStats": { + "determinePartitions": { + "processed": 0, + "processedBytes": 0, + "processedWithError": 0, + "thrownAway": 0, + "unparseable": 0 + }, + "buildSegments": { + "processed": 39244, + "processedBytes": 17106256, + "processedWithError": 0, + "thrownAway": 0, + "unparseable": 0 + } + }, + "errorMsg": null, + "segmentAvailabilityConfirmed": false, + "segmentAvailabilityWaitTimeMs": 0 + } + } + } + ``` + +
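+The `rowStats` object is usually the part to check when validating an ingestion. As a sketch, assuming `jq` is installed, you can summarize the row counts for the `buildSegments` phase as follows.
+
+```shell
+# Summarize row counts from a task completion report.
+TASK_ID="query-52a8aafe-7265-4427-89fe-dc51275cc470"   # replace with your task ID
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/${TASK_ID}/reports" \
+  | jq '.ingestionStatsAndErrors.payload.rowStats.buildSegments | {processed, unparseable, processedWithError}'
+```
+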
+ +## Task operations + +### Submit a task + +Submits a JSON-based ingestion spec or supervisor spec to the Overlord. It returns the task ID of the submitted task. For information on creating an ingestion spec, refer to the [ingestion spec reference](../ingestion/ingestion-spec.md). + +Note that for most batch ingestion use cases, you should use the [SQL-ingestion API](./sql-ingestion-api.md) instead of JSON-based batch ingestion. + +#### URL + +`POST` `/druid/indexer/v1/task` + +#### Responses + + + + + + +
+ +*Successfully submitted task* + +
+ + + +
+ +*Missing information in query* + +
+ + + +
+ +*Incorrect request body media type* + +
+ + + +
+ +*Unexpected token or characters in request body* + +
+
+
+---
+
+#### Sample request
+
+The following request is an example of submitting a task to create a datasource named `wikipedia_auto`.
+
+
+
+
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task" \
+--header 'Content-Type: application/json' \
+--data '{
+  "type" : "index_parallel",
+  "spec" : {
+    "dataSchema" : {
+      "dataSource" : "wikipedia_auto",
+      "timestampSpec": {
+        "column": "time",
+        "format": "iso"
+      },
+      "dimensionsSpec" : {
+        "useSchemaDiscovery": true
+      },
+      "metricsSpec" : [],
+      "granularitySpec" : {
+        "type" : "uniform",
+        "segmentGranularity" : "day",
+        "queryGranularity" : "none",
+        "intervals" : ["2015-09-12/2015-09-13"],
+        "rollup" : false
+      }
+    },
+    "ioConfig" : {
+      "type" : "index_parallel",
+      "inputSource" : {
+        "type" : "local",
+        "baseDir" : "quickstart/tutorial/",
+        "filter" : "wikiticker-2015-09-12-sampled.json.gz"
+      },
+      "inputFormat" : {
+        "type" : "json"
+      },
+      "appendToExisting" : false
+    },
+    "tuningConfig" : {
+      "type" : "index_parallel",
+      "maxRowsPerSegment" : 5000000,
+      "maxRowsInMemory" : 25000
+    }
+  }
+}'
+
+```
+
+
+
+
+```HTTP
+POST /druid/indexer/v1/task HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+Content-Type: application/json
+Content-Length: 952
+
+{
+  "type" : "index_parallel",
+  "spec" : {
+    "dataSchema" : {
+      "dataSource" : "wikipedia_auto",
+      "timestampSpec": {
+        "column": "time",
+        "format": "iso"
+      },
+      "dimensionsSpec" : {
+        "useSchemaDiscovery": true
+      },
+      "metricsSpec" : [],
+      "granularitySpec" : {
+        "type" : "uniform",
+        "segmentGranularity" : "day",
+        "queryGranularity" : "none",
+        "intervals" : ["2015-09-12/2015-09-13"],
+        "rollup" : false
+      }
+    },
+    "ioConfig" : {
+      "type" : "index_parallel",
+      "inputSource" : {
+        "type" : "local",
+        "baseDir" : "quickstart/tutorial/",
+        "filter" : "wikiticker-2015-09-12-sampled.json.gz"
+      },
+      "inputFormat" : {
+        "type" : "json"
+      },
+      "appendToExisting" : false
+    },
+    "tuningConfig" : {
+      "type" : "index_parallel",
+      "maxRowsPerSegment" : 5000000,
+      "maxRowsInMemory" : 25000
+    }
+  }
+}
+```
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "task": "index_parallel_wikipedia_odofhkle_2023-06-23T21:07:28.226Z" + } + ``` + +
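+Because the response contains only the generated task ID, a common pattern is to capture that ID and feed it to the status endpoint described earlier. The following is a minimal sketch that assumes `jq` is installed and that the ingestion spec above is saved locally as `wikipedia-index.json` (a hypothetical file name).
+
+```shell
+# Submit a task spec from a file, then immediately check the task status.
+TASK_ID=$(curl -s --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task" \
+  --header 'Content-Type: application/json' \
+  --data @wikipedia-index.json | jq -r '.task')
+echo "Submitted task: ${TASK_ID}"
+curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/${TASK_ID}/status" | jq -r '.status.statusCode'
+```
+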
+
+### Shut down a task
+
+Shuts down a task if it is not already complete. Returns a JSON object with the ID of the task that was shut down successfully.
+
+#### URL
+
+`POST` `/druid/indexer/v1/task/{taskId}/shutdown`
+
+#### Responses
+
+
+
+
+
+ +*Successfully shut down task* + +
+ + + +
+ +*Cannot find task with ID or task is no longer running* + +
+
+
+---
+
+#### Sample request
+
+The following request shows how to shut down a task with the ID `query-52a8aafe-7265-4427-89fe-dc51275cc470`.
+
+
+
+
+
+
+```shell
+curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/task/query-52a8aafe-7265-4427-89fe-dc51275cc470/shutdown"
+```
+
+
+
+
+
+```HTTP
+POST /druid/indexer/v1/task/query-52a8aafe-7265-4427-89fe-dc51275cc470/shutdown HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+```
+
+
+
+
+#### Sample response
+
+  View the response
+
+  ```json
+  {
+    "task": "query-52a8aafe-7265-4427-89fe-dc51275cc470"
+  }
+  ```
+
+ +### Shut down all tasks for a datasource + +Shuts down all tasks for a specified datasource. If successful, it returns a JSON object with the name of the datasource whose tasks are shut down. + +#### URL + +`POST` `/druid/indexer/v1/datasources/{datasource}/shutdownAllTasks` + +#### Responses + + + + + + +
+ +*Successfully shut down tasks* + +
+ + + +
+ +*Error or datasource does not have a running task* + +
+
+ +--- + +#### Sample request + +The following request is an example of shutting down all tasks for datasource `wikipedia_auto`. + + + + + + +```shell +curl --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/datasources/wikipedia_auto/shutdownAllTasks" +``` + + + + + +```HTTP +POST /druid/indexer/v1/datasources/wikipedia_auto/shutdownAllTasks HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+  View the response
+
+  ```json
+  {
+    "dataSource": "wikipedia_auto"
+  }
+  ```
+
+
+## Task management
+
+### Retrieve status objects for tasks
+
+Retrieves a list of task status objects for the task IDs provided in the request body. It returns a set of JSON objects with the status, duration, and location of each task, along with any error messages.
+
+#### URL
+
+`POST` `/druid/indexer/v1/taskStatus`
+
+#### Responses
+
+
+
+
+
+ +*Successfully retrieved status objects* + +
+ + + +
+ +*Missing request body or incorrect request body type* + +
+
+
+---
+
+#### Sample request
+
+The following request is an example of retrieving status objects for the task IDs `index_parallel_wikipedia_auto_jndhkpbo_2023-06-26T17:23:05.308Z` and `index_parallel_wikipedia_auto_jbgiianh_2023-06-26T23:17:56.769Z`.
+
+
+
+
+
+
+```shell
+curl "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/taskStatus" \
+--header 'Content-Type: application/json' \
+--data '["index_parallel_wikipedia_auto_jndhkpbo_2023-06-26T17:23:05.308Z","index_parallel_wikipedia_auto_jbgiianh_2023-06-26T23:17:56.769Z"]'
+```
+
+
+
+
+
+```HTTP
+POST /druid/indexer/v1/taskStatus HTTP/1.1
+Host: http://ROUTER_IP:ROUTER_PORT
+Content-Type: application/json
+Content-Length: 134
+
+["index_parallel_wikipedia_auto_jndhkpbo_2023-06-26T17:23:05.308Z", "index_parallel_wikipedia_auto_jbgiianh_2023-06-26T23:17:56.769Z"]
+```
+
+
+
+
+
+#### Sample response
+
+ View the response + + ```json + { + "index_parallel_wikipedia_auto_jbgiianh_2023-06-26T23:17:56.769Z": { + "id": "index_parallel_wikipedia_auto_jbgiianh_2023-06-26T23:17:56.769Z", + "status": "SUCCESS", + "duration": 10630, + "errorMsg": null, + "location": { + "host": "localhost", + "port": 8100, + "tlsPort": -1 + } + }, + "index_parallel_wikipedia_auto_jndhkpbo_2023-06-26T17:23:05.308Z": { + "id": "index_parallel_wikipedia_auto_jndhkpbo_2023-06-26T17:23:05.308Z", + "status": "SUCCESS", + "duration": 11012, + "errorMsg": null, + "location": { + "host": "localhost", + "port": 8100, + "tlsPort": -1 + } + } + } + ``` + +
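+One way to use this endpoint is to build the ID list from another list endpoint and post it back in a single batch. The following sketch, assuming `jq` is installed, chains the `runningTasks` endpoint into `taskStatus`.
+
+```shell
+# Fetch the status objects for every currently running task in one call.
+IDS=$(curl -s "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/runningTasks" | jq '[.[].id]')
+curl -s --request POST "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/taskStatus" \
+  --header 'Content-Type: application/json' \
+  --data "${IDS}"
+```
+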
+
+### Clean up pending segments for a datasource
+
+Manually cleans up the pending segments table in metadata storage for the given `datasource`. It returns a JSON object with
+`numDeleted`, the number of rows deleted from the pending segments table. The
+`druid.coordinator.kill.pendingSegments.on` [Coordinator setting](../configuration/index.md#data-management)
+automates this operation to run periodically.
+
+#### URL
+
+`DELETE` `/druid/indexer/v1/pendingSegments/{datasource}`
+
+#### Responses
+
+
+
+
+
+ +*Successfully deleted pending segments* + +
+
+ +--- + +#### Sample request + +The following request is an example of cleaning up pending segments for the `wikipedia_api` datasource. + + + + + + +```shell +curl --request DELETE "http://ROUTER_IP:ROUTER_PORT/druid/indexer/v1/pendingSegments/wikipedia_api" +``` + + + + + +```HTTP +DELETE /druid/indexer/v1/pendingSegments/wikipedia_api HTTP/1.1 +Host: http://ROUTER_IP:ROUTER_PORT +``` + + + + +#### Sample response + +
+ View the response + + ```json + { + "numDeleted": 2 + } + ``` + +
\ No newline at end of file diff --git a/docs/35.0.0/assets/compaction-config.png b/docs/35.0.0/assets/compaction-config.png new file mode 100644 index 0000000000..9dbcfefa80 Binary files /dev/null and b/docs/35.0.0/assets/compaction-config.png differ diff --git a/docs/35.0.0/assets/datasources-action-button.png b/docs/35.0.0/assets/datasources-action-button.png new file mode 100644 index 0000000000..6a52b8444d Binary files /dev/null and b/docs/35.0.0/assets/datasources-action-button.png differ diff --git a/docs/35.0.0/assets/druid-architecture.png b/docs/35.0.0/assets/druid-architecture.png new file mode 100644 index 0000000000..954a87bc1b Binary files /dev/null and b/docs/35.0.0/assets/druid-architecture.png differ diff --git a/docs/35.0.0/assets/druid-architecture.svg b/docs/35.0.0/assets/druid-architecture.svg new file mode 100644 index 0000000000..9d0e67188f --- /dev/null +++ b/docs/35.0.0/assets/druid-architecture.svg @@ -0,0 +1,19 @@ + + \ No newline at end of file diff --git a/docs/35.0.0/assets/druid-column-types.png b/docs/35.0.0/assets/druid-column-types.png new file mode 100644 index 0000000000..9db56c0681 Binary files /dev/null and b/docs/35.0.0/assets/druid-column-types.png differ diff --git a/docs/35.0.0/assets/druid-dataflow-2x.png b/docs/35.0.0/assets/druid-dataflow-2x.png new file mode 100644 index 0000000000..ab1c583e43 Binary files /dev/null and b/docs/35.0.0/assets/druid-dataflow-2x.png differ diff --git a/docs/35.0.0/assets/druid-dataflow-3.png b/docs/35.0.0/assets/druid-dataflow-3.png new file mode 100644 index 0000000000..355215cbce Binary files /dev/null and b/docs/35.0.0/assets/druid-dataflow-3.png differ diff --git a/docs/35.0.0/assets/druid-manage-1.png b/docs/35.0.0/assets/druid-manage-1.png new file mode 100644 index 0000000000..0d10c6e7bc Binary files /dev/null and b/docs/35.0.0/assets/druid-manage-1.png differ diff --git a/docs/35.0.0/assets/druid-timeline.png b/docs/35.0.0/assets/druid-timeline.png new file mode 100644 index 0000000000..40380e2794 Binary files /dev/null and b/docs/35.0.0/assets/druid-timeline.png differ diff --git a/docs/35.0.0/assets/files/kttm-kafka-supervisor.json b/docs/35.0.0/assets/files/kttm-kafka-supervisor.json new file mode 100644 index 0000000000..2096f9c7cd --- /dev/null +++ b/docs/35.0.0/assets/files/kttm-kafka-supervisor.json @@ -0,0 +1,66 @@ +{ + "type": "kafka", + "spec": { + "ioConfig": { + "type": "kafka", + "consumerProperties": { + "bootstrap.servers": "localhost:9092" + }, + "topic": "kttm", + "inputFormat": { + "type": "json" + }, + "useEarliestOffset": true + }, + "tuningConfig": { + "type": "kafka" + }, + "dataSchema": { + "dataSource": "kttm-kafka-supervisor-api", + "timestampSpec": { + "column": "timestamp", + "format": "iso" + }, + "dimensionsSpec": { + "dimensions": [ + "session", + "number", + "client_ip", + "language", + "adblock_list", + "app_version", + "path", + "loaded_image", + "referrer", + "referrer_host", + "server_ip", + "screen", + "window", + { + "type": "long", + "name": "session_length" + }, + "timezone", + "timezone_offset", + { + "type": "json", + "name": "event" + }, + { + "type": "json", + "name": "agent" + }, + { + "type": "json", + "name": "geo_ip" + } + ] + }, + "granularitySpec": { + "queryGranularity": "none", + "rollup": false, + "segmentGranularity": "day" + } + } + } +} \ No newline at end of file diff --git a/docs/35.0.0/assets/indexing_service.png b/docs/35.0.0/assets/indexing_service.png new file mode 100644 index 0000000000..a4462a413c Binary files /dev/null and 
b/docs/35.0.0/assets/indexing_service.png differ diff --git a/docs/35.0.0/assets/multi-stage-query/msq-ui-download-query-results.png b/docs/35.0.0/assets/multi-stage-query/msq-ui-download-query-results.png new file mode 100644 index 0000000000..e428cb2dfd Binary files /dev/null and b/docs/35.0.0/assets/multi-stage-query/msq-ui-download-query-results.png differ diff --git a/docs/35.0.0/assets/multi-stage-query/tutorial-msq-convert.png b/docs/35.0.0/assets/multi-stage-query/tutorial-msq-convert.png new file mode 100644 index 0000000000..f16941af67 Binary files /dev/null and b/docs/35.0.0/assets/multi-stage-query/tutorial-msq-convert.png differ diff --git a/docs/35.0.0/assets/multi-stage-query/ui-annotated.png b/docs/35.0.0/assets/multi-stage-query/ui-annotated.png new file mode 100644 index 0000000000..5a98c00d19 Binary files /dev/null and b/docs/35.0.0/assets/multi-stage-query/ui-annotated.png differ diff --git a/docs/35.0.0/assets/multi-stage-query/ui-empty.png b/docs/35.0.0/assets/multi-stage-query/ui-empty.png new file mode 100644 index 0000000000..7c30d5a671 Binary files /dev/null and b/docs/35.0.0/assets/multi-stage-query/ui-empty.png differ diff --git a/docs/35.0.0/assets/native-queries-01.png b/docs/35.0.0/assets/native-queries-01.png new file mode 100644 index 0000000000..27fd29b632 Binary files /dev/null and b/docs/35.0.0/assets/native-queries-01.png differ diff --git a/docs/35.0.0/assets/nested-combined-json.png b/docs/35.0.0/assets/nested-combined-json.png new file mode 100644 index 0000000000..f98bfcf538 Binary files /dev/null and b/docs/35.0.0/assets/nested-combined-json.png differ diff --git a/docs/35.0.0/assets/nested-display-data-types.png b/docs/35.0.0/assets/nested-display-data-types.png new file mode 100644 index 0000000000..2776068ee4 Binary files /dev/null and b/docs/35.0.0/assets/nested-display-data-types.png differ diff --git a/docs/35.0.0/assets/nested-examine-schema.png b/docs/35.0.0/assets/nested-examine-schema.png new file mode 100644 index 0000000000..11769a162a Binary files /dev/null and b/docs/35.0.0/assets/nested-examine-schema.png differ diff --git a/docs/35.0.0/assets/nested-extract-as-type.png b/docs/35.0.0/assets/nested-extract-as-type.png new file mode 100644 index 0000000000..c54a5eeb62 Binary files /dev/null and b/docs/35.0.0/assets/nested-extract-as-type.png differ diff --git a/docs/35.0.0/assets/nested-extract-elements.png b/docs/35.0.0/assets/nested-extract-elements.png new file mode 100644 index 0000000000..9f7076b50d Binary files /dev/null and b/docs/35.0.0/assets/nested-extract-elements.png differ diff --git a/docs/35.0.0/assets/nested-group-aggregate.png b/docs/35.0.0/assets/nested-group-aggregate.png new file mode 100644 index 0000000000..2d1907fe64 Binary files /dev/null and b/docs/35.0.0/assets/nested-group-aggregate.png differ diff --git a/docs/35.0.0/assets/nested-msq-ingestion-transform.png b/docs/35.0.0/assets/nested-msq-ingestion-transform.png new file mode 100644 index 0000000000..b46fde8593 Binary files /dev/null and b/docs/35.0.0/assets/nested-msq-ingestion-transform.png differ diff --git a/docs/35.0.0/assets/nested-msq-ingestion.png b/docs/35.0.0/assets/nested-msq-ingestion.png new file mode 100644 index 0000000000..0487ee1883 Binary files /dev/null and b/docs/35.0.0/assets/nested-msq-ingestion.png differ diff --git a/docs/35.0.0/assets/nested-parse-deserialize.png b/docs/35.0.0/assets/nested-parse-deserialize.png new file mode 100644 index 0000000000..881a67164b Binary files /dev/null and 
b/docs/35.0.0/assets/nested-parse-deserialize.png differ diff --git a/docs/35.0.0/assets/nested-retrieve-json.png b/docs/35.0.0/assets/nested-retrieve-json.png new file mode 100644 index 0000000000..4f5fa0f969 Binary files /dev/null and b/docs/35.0.0/assets/nested-retrieve-json.png differ diff --git a/docs/35.0.0/assets/nested-return-json.png b/docs/35.0.0/assets/nested-return-json.png new file mode 100644 index 0000000000..9a67aaa71d Binary files /dev/null and b/docs/35.0.0/assets/nested-return-json.png differ diff --git a/docs/35.0.0/assets/retention-rules.png b/docs/35.0.0/assets/retention-rules.png new file mode 100644 index 0000000000..59061d5511 Binary files /dev/null and b/docs/35.0.0/assets/retention-rules.png differ diff --git a/docs/35.0.0/assets/security-model-1.png b/docs/35.0.0/assets/security-model-1.png new file mode 100644 index 0000000000..55c7f24c54 Binary files /dev/null and b/docs/35.0.0/assets/security-model-1.png differ diff --git a/docs/35.0.0/assets/security-model-2.png b/docs/35.0.0/assets/security-model-2.png new file mode 100644 index 0000000000..dcb256bacc Binary files /dev/null and b/docs/35.0.0/assets/security-model-2.png differ diff --git a/docs/35.0.0/assets/segmentPropagation.png b/docs/35.0.0/assets/segmentPropagation.png new file mode 100644 index 0000000000..e1ec82029e Binary files /dev/null and b/docs/35.0.0/assets/segmentPropagation.png differ diff --git a/docs/35.0.0/assets/services-overview.png b/docs/35.0.0/assets/services-overview.png new file mode 100644 index 0000000000..157ce608e5 Binary files /dev/null and b/docs/35.0.0/assets/services-overview.png differ diff --git a/docs/35.0.0/assets/set-query-context-insert-query.png b/docs/35.0.0/assets/set-query-context-insert-query.png new file mode 100644 index 0000000000..d156597d2a Binary files /dev/null and b/docs/35.0.0/assets/set-query-context-insert-query.png differ diff --git a/docs/35.0.0/assets/set-query-context-open-context-dialog.png b/docs/35.0.0/assets/set-query-context-open-context-dialog.png new file mode 100644 index 0000000000..765caa0d72 Binary files /dev/null and b/docs/35.0.0/assets/set-query-context-open-context-dialog.png differ diff --git a/docs/35.0.0/assets/set-query-context-query-view.png b/docs/35.0.0/assets/set-query-context-query-view.png new file mode 100644 index 0000000000..9d25d3c664 Binary files /dev/null and b/docs/35.0.0/assets/set-query-context-query-view.png differ diff --git a/docs/35.0.0/assets/set-query-context-run-the-query.png b/docs/35.0.0/assets/set-query-context-run-the-query.png new file mode 100644 index 0000000000..27f29f8390 Binary files /dev/null and b/docs/35.0.0/assets/set-query-context-run-the-query.png differ diff --git a/docs/35.0.0/assets/set-query-context-set-context-parameters.png b/docs/35.0.0/assets/set-query-context-set-context-parameters.png new file mode 100644 index 0000000000..17fa110501 Binary files /dev/null and b/docs/35.0.0/assets/set-query-context-set-context-parameters.png differ diff --git a/docs/35.0.0/assets/spectator-histogram-size-comparison.png b/docs/35.0.0/assets/spectator-histogram-size-comparison.png new file mode 100644 index 0000000000..306f45abd8 Binary files /dev/null and b/docs/35.0.0/assets/spectator-histogram-size-comparison.png differ diff --git a/docs/35.0.0/assets/supervisor-actions.png b/docs/35.0.0/assets/supervisor-actions.png new file mode 100644 index 0000000000..2797cf69ea Binary files /dev/null and b/docs/35.0.0/assets/supervisor-actions.png differ diff --git a/docs/35.0.0/assets/supervisor-info-dialog.png 
b/docs/35.0.0/assets/supervisor-info-dialog.png new file mode 100644 index 0000000000..3be424a413 Binary files /dev/null and b/docs/35.0.0/assets/supervisor-info-dialog.png differ diff --git a/docs/35.0.0/assets/supervisor-view.png b/docs/35.0.0/assets/supervisor-view.png new file mode 100644 index 0000000000..e3100cdd3b Binary files /dev/null and b/docs/35.0.0/assets/supervisor-view.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-00.png b/docs/35.0.0/assets/tutorial-batch-data-loader-00.png new file mode 100644 index 0000000000..793b6c1232 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-00.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-01.png b/docs/35.0.0/assets/tutorial-batch-data-loader-01.png new file mode 100644 index 0000000000..2ff1d6398b Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-01.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-015.png b/docs/35.0.0/assets/tutorial-batch-data-loader-015.png new file mode 100644 index 0000000000..fd588caea4 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-015.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-02.png b/docs/35.0.0/assets/tutorial-batch-data-loader-02.png new file mode 100644 index 0000000000..736188cb13 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-02.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-03.png b/docs/35.0.0/assets/tutorial-batch-data-loader-03.png new file mode 100644 index 0000000000..74bb8c88fe Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-03.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-04.png b/docs/35.0.0/assets/tutorial-batch-data-loader-04.png new file mode 100644 index 0000000000..e4237cda8a Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-04.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-05.png b/docs/35.0.0/assets/tutorial-batch-data-loader-05.png new file mode 100644 index 0000000000..d245dde67a Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-05.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-06.png b/docs/35.0.0/assets/tutorial-batch-data-loader-06.png new file mode 100644 index 0000000000..285fd57ba2 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-06.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-07.png b/docs/35.0.0/assets/tutorial-batch-data-loader-07.png new file mode 100644 index 0000000000..481838d789 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-07.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-08.png b/docs/35.0.0/assets/tutorial-batch-data-loader-08.png new file mode 100644 index 0000000000..b64c5a4e0d Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-08.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-09.png b/docs/35.0.0/assets/tutorial-batch-data-loader-09.png new file mode 100644 index 0000000000..bec3085f67 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-09.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-10.png b/docs/35.0.0/assets/tutorial-batch-data-loader-10.png new file mode 100644 index 0000000000..857a5a5c4f Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-10.png differ diff --git 
a/docs/35.0.0/assets/tutorial-batch-data-loader-11.png b/docs/35.0.0/assets/tutorial-batch-data-loader-11.png new file mode 100644 index 0000000000..bf7e304b8a Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-11.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-data-loader-12.png b/docs/35.0.0/assets/tutorial-batch-data-loader-12.png new file mode 100644 index 0000000000..f195b9ca50 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-data-loader-12.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-submit-task-01.png b/docs/35.0.0/assets/tutorial-batch-submit-task-01.png new file mode 100644 index 0000000000..01b91427fc Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-submit-task-01.png differ diff --git a/docs/35.0.0/assets/tutorial-batch-submit-task-02.png b/docs/35.0.0/assets/tutorial-batch-submit-task-02.png new file mode 100644 index 0000000000..ba7caeb22c Binary files /dev/null and b/docs/35.0.0/assets/tutorial-batch-submit-task-02.png differ diff --git a/docs/35.0.0/assets/tutorial-compaction-01.png b/docs/35.0.0/assets/tutorial-compaction-01.png new file mode 100644 index 0000000000..aeb9bf36fc Binary files /dev/null and b/docs/35.0.0/assets/tutorial-compaction-01.png differ diff --git a/docs/35.0.0/assets/tutorial-compaction-02.png b/docs/35.0.0/assets/tutorial-compaction-02.png new file mode 100644 index 0000000000..836d8a7a7c Binary files /dev/null and b/docs/35.0.0/assets/tutorial-compaction-02.png differ diff --git a/docs/35.0.0/assets/tutorial-compaction-03.png b/docs/35.0.0/assets/tutorial-compaction-03.png new file mode 100644 index 0000000000..d51f8f8a8a Binary files /dev/null and b/docs/35.0.0/assets/tutorial-compaction-03.png differ diff --git a/docs/35.0.0/assets/tutorial-compaction-04.png b/docs/35.0.0/assets/tutorial-compaction-04.png new file mode 100644 index 0000000000..46c5b1d261 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-compaction-04.png differ diff --git a/docs/35.0.0/assets/tutorial-compaction-05.png b/docs/35.0.0/assets/tutorial-compaction-05.png new file mode 100644 index 0000000000..e692694aff Binary files /dev/null and b/docs/35.0.0/assets/tutorial-compaction-05.png differ diff --git a/docs/35.0.0/assets/tutorial-compaction-06.png b/docs/35.0.0/assets/tutorial-compaction-06.png new file mode 100644 index 0000000000..55c999f9d1 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-compaction-06.png differ diff --git a/docs/35.0.0/assets/tutorial-compaction-07.png b/docs/35.0.0/assets/tutorial-compaction-07.png new file mode 100644 index 0000000000..661e89784c Binary files /dev/null and b/docs/35.0.0/assets/tutorial-compaction-07.png differ diff --git a/docs/35.0.0/assets/tutorial-compaction-08.png b/docs/35.0.0/assets/tutorial-compaction-08.png new file mode 100644 index 0000000000..6e3f1aa037 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-compaction-08.png differ diff --git a/docs/35.0.0/assets/tutorial-deletion-01.png b/docs/35.0.0/assets/tutorial-deletion-01.png new file mode 100644 index 0000000000..942f057d7e Binary files /dev/null and b/docs/35.0.0/assets/tutorial-deletion-01.png differ diff --git a/docs/35.0.0/assets/tutorial-deletion-02.png b/docs/35.0.0/assets/tutorial-deletion-02.png new file mode 100644 index 0000000000..516fdf7fe8 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-deletion-02.png differ diff --git a/docs/35.0.0/assets/tutorial-deletion-03.png b/docs/35.0.0/assets/tutorial-deletion-03.png new file mode 100644 index 
0000000000..666ff7a89e Binary files /dev/null and b/docs/35.0.0/assets/tutorial-deletion-03.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-01.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-01.png new file mode 100644 index 0000000000..7f8d0daacd Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-01.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-02.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-02.png new file mode 100644 index 0000000000..8475eeba2b Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-02.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-03.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-03.png new file mode 100644 index 0000000000..dc7400404f Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-03.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-04.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-04.png new file mode 100644 index 0000000000..5703066959 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-04.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-05.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-05.png new file mode 100644 index 0000000000..c920f05658 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-05.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-06.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-06.png new file mode 100644 index 0000000000..4fb96dd47c Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-06.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-07.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-07.png new file mode 100644 index 0000000000..b3013b735d Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-07.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-08.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-08.png new file mode 100644 index 0000000000..b1cdd2df16 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-08.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-09.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-09.png new file mode 100644 index 0000000000..e2045ac895 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-09.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-10.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-10.png new file mode 100644 index 0000000000..39eaa3750a Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-10.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-11.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-11.png new file mode 100644 index 0000000000..7bd3d9a25e Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-11.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-data-loader-12.png b/docs/35.0.0/assets/tutorial-kafka-data-loader-12.png new file mode 100644 index 0000000000..ed952b135b Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-data-loader-12.png differ diff --git a/docs/35.0.0/assets/tutorial-kafka-submit-supervisor-01.png b/docs/35.0.0/assets/tutorial-kafka-submit-supervisor-01.png new file mode 100644 index 0000000000..809c0c6733 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-kafka-submit-supervisor-01.png differ diff --git a/docs/35.0.0/assets/tutorial-query-01.png 
b/docs/35.0.0/assets/tutorial-query-01.png new file mode 100644 index 0000000000..99354cbdfe Binary files /dev/null and b/docs/35.0.0/assets/tutorial-query-01.png differ diff --git a/docs/35.0.0/assets/tutorial-query-02.png b/docs/35.0.0/assets/tutorial-query-02.png new file mode 100644 index 0000000000..4d789f5989 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-query-02.png differ diff --git a/docs/35.0.0/assets/tutorial-query-03.png b/docs/35.0.0/assets/tutorial-query-03.png new file mode 100644 index 0000000000..841d36bfe8 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-query-03.png differ diff --git a/docs/35.0.0/assets/tutorial-query-04.png b/docs/35.0.0/assets/tutorial-query-04.png new file mode 100644 index 0000000000..7c713e367c Binary files /dev/null and b/docs/35.0.0/assets/tutorial-query-04.png differ diff --git a/docs/35.0.0/assets/tutorial-query-05.png b/docs/35.0.0/assets/tutorial-query-05.png new file mode 100644 index 0000000000..4b3d78d155 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-query-05.png differ diff --git a/docs/35.0.0/assets/tutorial-query-06.png b/docs/35.0.0/assets/tutorial-query-06.png new file mode 100644 index 0000000000..cb35a07871 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-query-06.png differ diff --git a/docs/35.0.0/assets/tutorial-query-07.png b/docs/35.0.0/assets/tutorial-query-07.png new file mode 100644 index 0000000000..aa94d629f8 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-query-07.png differ diff --git a/docs/35.0.0/assets/tutorial-query-deepstorage-retention-rule.png b/docs/35.0.0/assets/tutorial-query-deepstorage-retention-rule.png new file mode 100644 index 0000000000..9dee37bdea Binary files /dev/null and b/docs/35.0.0/assets/tutorial-query-deepstorage-retention-rule.png differ diff --git a/docs/35.0.0/assets/tutorial-quickstart-01.png b/docs/35.0.0/assets/tutorial-quickstart-01.png new file mode 100644 index 0000000000..649708b7c4 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-quickstart-01.png differ diff --git a/docs/35.0.0/assets/tutorial-quickstart-02.png b/docs/35.0.0/assets/tutorial-quickstart-02.png new file mode 100644 index 0000000000..5edec67c3f Binary files /dev/null and b/docs/35.0.0/assets/tutorial-quickstart-02.png differ diff --git a/docs/35.0.0/assets/tutorial-quickstart-03.png b/docs/35.0.0/assets/tutorial-quickstart-03.png new file mode 100644 index 0000000000..917f25d040 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-quickstart-03.png differ diff --git a/docs/35.0.0/assets/tutorial-quickstart-04.png b/docs/35.0.0/assets/tutorial-quickstart-04.png new file mode 100644 index 0000000000..e847ef550c Binary files /dev/null and b/docs/35.0.0/assets/tutorial-quickstart-04.png differ diff --git a/docs/35.0.0/assets/tutorial-quickstart-05.png b/docs/35.0.0/assets/tutorial-quickstart-05.png new file mode 100644 index 0000000000..da3ed0dfa6 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-quickstart-05.png differ diff --git a/docs/35.0.0/assets/tutorial-retention-00.png b/docs/35.0.0/assets/tutorial-retention-00.png new file mode 100644 index 0000000000..a3f84a9fe6 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-retention-00.png differ diff --git a/docs/35.0.0/assets/tutorial-retention-01.png b/docs/35.0.0/assets/tutorial-retention-01.png new file mode 100644 index 0000000000..35a97c2626 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-retention-01.png differ diff --git a/docs/35.0.0/assets/tutorial-retention-02.png 
b/docs/35.0.0/assets/tutorial-retention-02.png new file mode 100644 index 0000000000..f38fad0d27 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-retention-02.png differ diff --git a/docs/35.0.0/assets/tutorial-retention-03.png b/docs/35.0.0/assets/tutorial-retention-03.png new file mode 100644 index 0000000000..256836a2d4 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-retention-03.png differ diff --git a/docs/35.0.0/assets/tutorial-retention-04.png b/docs/35.0.0/assets/tutorial-retention-04.png new file mode 100644 index 0000000000..d39495f87d Binary files /dev/null and b/docs/35.0.0/assets/tutorial-retention-04.png differ diff --git a/docs/35.0.0/assets/tutorial-retention-05.png b/docs/35.0.0/assets/tutorial-retention-05.png new file mode 100644 index 0000000000..638a752fac Binary files /dev/null and b/docs/35.0.0/assets/tutorial-retention-05.png differ diff --git a/docs/35.0.0/assets/tutorial-retention-06.png b/docs/35.0.0/assets/tutorial-retention-06.png new file mode 100644 index 0000000000..f47cbffbb1 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-retention-06.png differ diff --git a/docs/35.0.0/assets/tutorial-sql-aggregate-query.png b/docs/35.0.0/assets/tutorial-sql-aggregate-query.png new file mode 100644 index 0000000000..0ffbff60e0 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-sql-aggregate-query.png differ diff --git a/docs/35.0.0/assets/tutorial-sql-auto-queries.png b/docs/35.0.0/assets/tutorial-sql-auto-queries.png new file mode 100644 index 0000000000..dc04a8de6f Binary files /dev/null and b/docs/35.0.0/assets/tutorial-sql-auto-queries.png differ diff --git a/docs/35.0.0/assets/tutorial-sql-count-distinct-help.png b/docs/35.0.0/assets/tutorial-sql-count-distinct-help.png new file mode 100644 index 0000000000..5327972d2a Binary files /dev/null and b/docs/35.0.0/assets/tutorial-sql-count-distinct-help.png differ diff --git a/docs/35.0.0/assets/tutorial-sql-count-distinct.png b/docs/35.0.0/assets/tutorial-sql-count-distinct.png new file mode 100644 index 0000000000..5fb9b2ae0b Binary files /dev/null and b/docs/35.0.0/assets/tutorial-sql-count-distinct.png differ diff --git a/docs/35.0.0/assets/tutorial-sql-demo-queries.png b/docs/35.0.0/assets/tutorial-sql-demo-queries.png new file mode 100644 index 0000000000..16fc040a67 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-sql-demo-queries.png differ diff --git a/docs/35.0.0/assets/tutorial-sql-query-plan.png b/docs/35.0.0/assets/tutorial-sql-query-plan.png new file mode 100644 index 0000000000..03f3c3cc6e Binary files /dev/null and b/docs/35.0.0/assets/tutorial-sql-query-plan.png differ diff --git a/docs/35.0.0/assets/tutorial-sql-result-column-actions.png b/docs/35.0.0/assets/tutorial-sql-result-column-actions.png new file mode 100644 index 0000000000..16518d4bff Binary files /dev/null and b/docs/35.0.0/assets/tutorial-sql-result-column-actions.png differ diff --git a/docs/35.0.0/assets/tutorial-theta-01.png b/docs/35.0.0/assets/tutorial-theta-01.png new file mode 100644 index 0000000000..2411fbf194 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-theta-01.png differ diff --git a/docs/35.0.0/assets/tutorial-theta-02.png b/docs/35.0.0/assets/tutorial-theta-02.png new file mode 100644 index 0000000000..ce849fd36a Binary files /dev/null and b/docs/35.0.0/assets/tutorial-theta-02.png differ diff --git a/docs/35.0.0/assets/tutorial-theta-03.png b/docs/35.0.0/assets/tutorial-theta-03.png new file mode 100644 index 0000000000..316bf7f0b0 Binary files /dev/null and 
b/docs/35.0.0/assets/tutorial-theta-03.png differ diff --git a/docs/35.0.0/assets/tutorial-theta-04.png b/docs/35.0.0/assets/tutorial-theta-04.png new file mode 100644 index 0000000000..21f383af6d Binary files /dev/null and b/docs/35.0.0/assets/tutorial-theta-04.png differ diff --git a/docs/35.0.0/assets/tutorial-theta-05.png b/docs/35.0.0/assets/tutorial-theta-05.png new file mode 100644 index 0000000000..ec2c8df6d3 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-theta-05.png differ diff --git a/docs/35.0.0/assets/tutorial-theta-06.png b/docs/35.0.0/assets/tutorial-theta-06.png new file mode 100644 index 0000000000..4048aa2389 Binary files /dev/null and b/docs/35.0.0/assets/tutorial-theta-06.png differ diff --git a/docs/35.0.0/assets/tutorial-theta-07.png b/docs/35.0.0/assets/tutorial-theta-07.png new file mode 100644 index 0000000000..369b5914ad Binary files /dev/null and b/docs/35.0.0/assets/tutorial-theta-07.png differ diff --git a/docs/35.0.0/assets/tutorial-theta-08.png b/docs/35.0.0/assets/tutorial-theta-08.png new file mode 100644 index 0000000000..59a6bc051e Binary files /dev/null and b/docs/35.0.0/assets/tutorial-theta-08.png differ diff --git a/docs/35.0.0/assets/web-console-0.7-tasks.png b/docs/35.0.0/assets/web-console-0.7-tasks.png new file mode 100644 index 0000000000..80080ba8ed Binary files /dev/null and b/docs/35.0.0/assets/web-console-0.7-tasks.png differ diff --git a/docs/35.0.0/assets/web-console-01-home-view.png b/docs/35.0.0/assets/web-console-01-home-view.png new file mode 100644 index 0000000000..39b6e8a1a6 Binary files /dev/null and b/docs/35.0.0/assets/web-console-01-home-view.png differ diff --git a/docs/35.0.0/assets/web-console-02-data-loader-1.png b/docs/35.0.0/assets/web-console-02-data-loader-1.png new file mode 100644 index 0000000000..ecd18c01f9 Binary files /dev/null and b/docs/35.0.0/assets/web-console-02-data-loader-1.png differ diff --git a/docs/35.0.0/assets/web-console-03-data-loader-2.png b/docs/35.0.0/assets/web-console-03-data-loader-2.png new file mode 100644 index 0000000000..bfb7be59cf Binary files /dev/null and b/docs/35.0.0/assets/web-console-03-data-loader-2.png differ diff --git a/docs/35.0.0/assets/web-console-04-datasources.png b/docs/35.0.0/assets/web-console-04-datasources.png new file mode 100644 index 0000000000..fab3cec452 Binary files /dev/null and b/docs/35.0.0/assets/web-console-04-datasources.png differ diff --git a/docs/35.0.0/assets/web-console-05-retention.png b/docs/35.0.0/assets/web-console-05-retention.png new file mode 100644 index 0000000000..96278525a8 Binary files /dev/null and b/docs/35.0.0/assets/web-console-05-retention.png differ diff --git a/docs/35.0.0/assets/web-console-06-segments.png b/docs/35.0.0/assets/web-console-06-segments.png new file mode 100644 index 0000000000..9e9e9ab985 Binary files /dev/null and b/docs/35.0.0/assets/web-console-06-segments.png differ diff --git a/docs/35.0.0/assets/web-console-07-supervisors.png b/docs/35.0.0/assets/web-console-07-supervisors.png new file mode 100644 index 0000000000..70391bd642 Binary files /dev/null and b/docs/35.0.0/assets/web-console-07-supervisors.png differ diff --git a/docs/35.0.0/assets/web-console-08-supervisor-status.png b/docs/35.0.0/assets/web-console-08-supervisor-status.png new file mode 100644 index 0000000000..1bcfccdfe6 Binary files /dev/null and b/docs/35.0.0/assets/web-console-08-supervisor-status.png differ diff --git a/docs/35.0.0/assets/web-console-09-task-status.png b/docs/35.0.0/assets/web-console-09-task-status.png new file mode 
100644 index 0000000000..100e8ada0e Binary files /dev/null and b/docs/35.0.0/assets/web-console-09-task-status.png differ diff --git a/docs/35.0.0/assets/web-console-10-servers.png b/docs/35.0.0/assets/web-console-10-servers.png new file mode 100644 index 0000000000..a3e0084e12 Binary files /dev/null and b/docs/35.0.0/assets/web-console-10-servers.png differ diff --git a/docs/35.0.0/assets/web-console-11-query-sql.png b/docs/35.0.0/assets/web-console-11-query-sql.png new file mode 100644 index 0000000000..a144774f46 Binary files /dev/null and b/docs/35.0.0/assets/web-console-11-query-sql.png differ diff --git a/docs/35.0.0/assets/web-console-12-query-rune.png b/docs/35.0.0/assets/web-console-12-query-rune.png new file mode 100644 index 0000000000..8c5e270562 Binary files /dev/null and b/docs/35.0.0/assets/web-console-12-query-rune.png differ diff --git a/docs/35.0.0/assets/web-console-13-lookups.png b/docs/35.0.0/assets/web-console-13-lookups.png new file mode 100644 index 0000000000..fa0bd0b060 Binary files /dev/null and b/docs/35.0.0/assets/web-console-13-lookups.png differ diff --git a/docs/35.0.0/comparisons/druid-vs-elasticsearch.md b/docs/35.0.0/comparisons/druid-vs-elasticsearch.md new file mode 100644 index 0000000000..82752aa7ad --- /dev/null +++ b/docs/35.0.0/comparisons/druid-vs-elasticsearch.md @@ -0,0 +1,39 @@ +--- +id: druid-vs-elasticsearch +title: "Apache Druid vs Elasticsearch" +--- + + + + +We are not experts on search systems; if anything is incorrect about our portrayal, please let us know on the mailing list or via some other means. + +Elasticsearch is a search system based on Apache Lucene. It provides full text search for schema-free documents +and provides access to raw event-level data. Elasticsearch is increasingly adding support for analytics and aggregations. +[Some members of the community](https://groups.google.com/forum/#!msg/druid-development/nlpwTHNclj8/sOuWlKOzPpYJ) have pointed out +that the resource requirements for data ingestion and aggregation in Elasticsearch are much higher than those of Druid. + +Elasticsearch also does not support data summarization/roll-up at ingestion time, which can compact the data that needs to be +stored by up to 100x with real-world data sets. This leads to Elasticsearch having greater storage requirements. + +Druid focuses on OLAP workflows. Druid is optimized for high performance (fast aggregation and ingestion) at low cost, +and supports a wide range of analytic operations. Druid has some basic search support for structured event data, but does not support +full text search. Druid also does not support completely unstructured data. Measures must be defined in a Druid schema such that +summarization/roll-up can be done. diff --git a/docs/35.0.0/comparisons/druid-vs-key-value.md b/docs/35.0.0/comparisons/druid-vs-key-value.md new file mode 100644 index 0000000000..57f3dec66d --- /dev/null +++ b/docs/35.0.0/comparisons/druid-vs-key-value.md @@ -0,0 +1,46 @@ +--- +id: druid-vs-key-value +title: "Apache Druid vs. Key/Value Stores (HBase/Cassandra/OpenTSDB)" +--- + + + + +Druid is highly optimized for scans and aggregations, and it supports arbitrarily deep drill-downs into data sets. This same functionality +is supported in key/value stores in two ways: + +1. Pre-compute all permutations of possible user queries +2. Range scans on event data + +When pre-computing results, the key is the exact parameters of the query, and the value is the result of the query.
+The queries return extremely quickly, but at the cost of flexibility, as ad-hoc exploratory queries are not possible with +pre-computing every possible query permutation. Pre-computing all permutations of all ad-hoc queries leads to result sets +that grow exponentially with the number of columns of a data set, and pre-computing queries for complex real-world data sets +can require hours of pre-processing time. + +The other approach to using key/value stores for aggregations is to use the dimensions of an event as the key and the event measures as the value. +Aggregations are done by issuing range scans on this data. Timeseries-specific databases such as OpenTSDB use this approach. +One of the limitations here is that the key/value storage model does not have indexes for any kind of filtering other than prefix ranges, +which can be used to filter a query down to a metric and time range, but cannot resolve complex predicates to narrow the exact data to scan. +When the number of rows to scan gets large, this limitation can greatly reduce performance. It is also harder to achieve good +locality with key/value stores because most don’t support pushing down aggregates to the storage layer. + +For arbitrary exploration of data (flexible data filtering), Druid's custom column format enables ad-hoc queries without pre-computation. The format +also enables fast scans on columns, which is important for good aggregation performance. diff --git a/docs/35.0.0/comparisons/druid-vs-kudu.md b/docs/35.0.0/comparisons/druid-vs-kudu.md new file mode 100644 index 0000000000..b992a1633d --- /dev/null +++ b/docs/35.0.0/comparisons/druid-vs-kudu.md @@ -0,0 +1,39 @@ +--- +id: druid-vs-kudu +title: "Apache Druid vs Kudu" +--- + + + + +Kudu's storage format enables single row updates, whereas updates to existing Druid segments require recreating the segment, so theoretically +the process for updating old values should be higher latency in Druid. However, the requirements in Kudu for maintaining extra head space to store +updates, as well as organizing data by id instead of time, have the potential to introduce some extra latency and to read +data that is not needed to answer a query at query time. + +Druid summarizes/rolls up data at ingestion time, which in practice reduces the raw data that needs to be +stored significantly (up to 40 times on average), and increases performance of scanning raw data significantly. +Druid segments also contain bitmap indexes for fast filtering, which Kudu does not currently support. +Druid's segment architecture is heavily geared towards fast aggregates and filters, and towards OLAP workflows. Appends are very +fast in Druid, whereas updates of older data are higher latency. This is by design, as the data Druid is good for is typically event data +that does not need to be updated too frequently. Kudu supports arbitrary primary keys with uniqueness constraints, and +efficient lookup by ranges of those keys. Kudu chooses not to include an execution engine, but supports sufficient +operations so as to allow node-local processing from the execution engines. This means that Kudu can support multiple frameworks on the same data (e.g., MR, Spark, and SQL). +Druid includes its own query layer that allows it to push down aggregations and computations directly to data processes for faster query processing.
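The ingestion-time rollup mentioned above is configured through the `granularitySpec` and `metricsSpec` of an ingestion spec. The following is only a rough sketch (the datasource and column names are hypothetical, not from this documentation set) of a `dataSchema` that pre-aggregates raw events down to one stored row per minute per dimension combination:

```json
{
  "dataSchema": {
    "dataSource": "example_events",
    "timestampSpec": { "column": "timestamp", "format": "iso" },
    "dimensionsSpec": { "dimensions": ["channel", "user"] },
    "metricsSpec": [
      { "type": "count", "name": "count" },
      { "type": "longSum", "name": "added", "fieldName": "added" }
    ],
    "granularitySpec": {
      "segmentGranularity": "day",
      "queryGranularity": "minute",
      "rollup": true
    }
  }
}
```

With `rollup` enabled, rows that share the same truncated timestamp and dimension values are combined into a single stored row, which is where the storage reduction described above comes from.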
diff --git a/docs/35.0.0/comparisons/druid-vs-redshift.md b/docs/35.0.0/comparisons/druid-vs-redshift.md new file mode 100644 index 0000000000..3e2c7b9ead --- /dev/null +++ b/docs/35.0.0/comparisons/druid-vs-redshift.md @@ -0,0 +1,62 @@ +--- +id: druid-vs-redshift +title: "Apache Druid vs Redshift" +--- + + + + +### How does Druid compare to Redshift? + +To draw a distinction, Redshift started out as ParAccel (Actian), which Amazon licenses and has since heavily modified. + +Aside from potential performance differences, there are some functional differences: + +### Real-time data ingestion + +Because Druid is optimized to provide insight into massive quantities of streaming data, it is able to load and aggregate data in real time. + +Generally, traditional data warehouses, including column stores, work only with batch ingestion and are not optimal for regularly ingesting streaming data. + +### Druid is a read-oriented analytical data store + +Druid’s write semantics are not as fluid, and Druid does not support full joins (we support large table to small table joins). Redshift provides full SQL support, including joins and insert/update statements. + +### Data distribution model + +Druid’s data distribution is segment-based and leverages a highly available "deep" storage such as S3 or HDFS. Scaling up (or down) does not require massive copy actions or downtime; in fact, losing any number of Historical processes does not result in data loss because new Historical processes can always be brought up by reading data from "deep" storage. + +By contrast, ParAccel’s data distribution model is hash-based. Expanding the cluster requires re-hashing the data across the nodes, making it difficult to perform without taking downtime. Amazon’s Redshift works around this issue with a multi-step process: + +* set the cluster into read-only mode +* copy data from the cluster to a new cluster that exists in parallel +* redirect traffic to the new cluster + +### Replication strategy + +Druid employs segment-level data distribution, meaning that more processes can be added and rebalanced without having to perform a staged swap. The replication strategy also makes all replicas available for querying. Replication is done automatically and without any impact on performance. + +ParAccel’s hash-based distribution generally means that replication is conducted via hot spares. This puts a numerical limit on the number of nodes you can lose without losing data, and this replication strategy often does not allow the hot spare to help share query load. + +### Indexing strategy + +Along with column-oriented structures, Druid uses indexing structures to speed up query execution when a filter is provided. Indexing structures do increase storage overhead (and make it more difficult to allow for mutation), but they also significantly speed up queries. + +ParAccel does not appear to employ indexing strategies. diff --git a/docs/35.0.0/comparisons/druid-vs-spark.md b/docs/35.0.0/comparisons/druid-vs-spark.md new file mode 100644 index 0000000000..4d3a6b43da --- /dev/null +++ b/docs/35.0.0/comparisons/druid-vs-spark.md @@ -0,0 +1,42 @@ +--- +id: druid-vs-spark +title: "Apache Druid vs Spark" +--- + + + + +Druid and Spark are complementary solutions, as Druid can be used to accelerate OLAP queries in Spark. + +Spark is a general cluster computing framework initially designed around the concept of Resilient Distributed Datasets (RDDs).
+RDDs enable data reuse by persisting intermediate results +in memory and enable Spark to provide fast computations for iterative algorithms. +This is especially beneficial for certain workflows such as machine +learning, where the same operation may be applied over and over +again until some result is converged upon. The generality of Spark makes it very suitable as an engine to process (clean or transform) data. +Although Spark provides the ability to query data through Spark SQL, much like Hadoop, the query latencies are not specifically targeted to be interactive (sub-second). + +Druid focuses on extremely low latency queries and is ideal for powering applications used by thousands of users, where each query must +return fast enough that users can interactively explore the data. Druid fully indexes all data, and can act as a middle layer between Spark and your application. +One typical setup seen in production is to process data in Spark, and load the processed data into Druid for faster access. + +For more information about using Druid and Spark together, including benchmarks of the two systems, please see: + +https://www.linkedin.com/pulse/combining-druid-spark-interactive-flexible-analytics-scale-butani diff --git a/docs/35.0.0/comparisons/druid-vs-sql-on-hadoop.md b/docs/35.0.0/comparisons/druid-vs-sql-on-hadoop.md new file mode 100644 index 0000000000..00e4473125 --- /dev/null +++ b/docs/35.0.0/comparisons/druid-vs-sql-on-hadoop.md @@ -0,0 +1,82 @@ +--- +id: druid-vs-sql-on-hadoop +title: "Apache Druid vs SQL-on-Hadoop" +--- + + + + +SQL-on-Hadoop engines provide an +execution engine for various data formats and data stores, and +many can be made to push computations down to Druid, while providing a SQL interface to Druid. + +For a direct comparison between the technologies, and for deciding when to use only one or the other, things basically come down to your +product requirements and what the systems were designed to do. + +Druid was designed to + +1. be an always-on service +1. ingest data in real-time +1. handle slice-n-dice style ad-hoc queries + +SQL-on-Hadoop engines generally sidestep Map/Reduce, instead querying data directly from HDFS or, in some cases, other storage systems. +Some of these engines (including Impala and Presto) can be co-located with HDFS data nodes and coordinate with them to achieve data locality for queries. +What does this mean? We can talk about it in terms of three general areas: + +1. Queries +1. Data Ingestion +1. Query Flexibility + +### Queries + +Druid segments store data in a custom column format. Segments are scanned directly as part of queries, and each Druid server +calculates a set of results that are eventually merged at the Broker level. This means that the data transferred between servers +consists of queries and results, and all computation is done internally within the Druid servers. + +Most SQL-on-Hadoop engines are responsible for query planning and execution for underlying storage layers and storage formats. +They are processes that stay on even if there is no query running (eliminating the JVM startup costs from Hadoop MapReduce). +Some (Impala/Presto) SQL-on-Hadoop engines have daemon processes that can be run where the data is stored, virtually eliminating network transfer costs. There is still +some latency overhead (e.g. serialization/deserialization time) associated with pulling data from the underlying storage layer into the computation layer. We are unaware of exactly +how much of a performance impact this makes.
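To make the scatter-gather flow above concrete, the following is a minimal native query of the kind a client might POST to the Broker; the Broker fans it out to the servers that host the relevant segments and merges their partial results. The datasource name, interval, and metric here are hypothetical placeholders, not part of this documentation set:

```json
{
  "queryType": "timeseries",
  "dataSource": "example_events",
  "intervals": ["2024-01-01/2024-02-01"],
  "granularity": "day",
  "aggregations": [
    { "type": "longSum", "name": "added", "fieldName": "added" }
  ]
}
```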
+ +### Data Ingestion + +Druid is built to allow for real-time ingestion of data. You can ingest data and query it immediately upon ingestion; +the latency between when an event occurs and when it is reflected in the data is dominated by how long it takes to deliver the event to Druid. + +SQL-on-Hadoop engines, being based on data in HDFS or some other backing store, are limited in their data ingestion rates by the +rate at which that backing store can make data available. Generally, the backing store is the biggest bottleneck for +how quickly data can become available. + +### Query Flexibility + +Druid's query language is fairly low level and maps to how Druid operates internally. Although Druid can be combined with a high level query +planner to support most SQL queries and analytic SQL queries (minus joins among large tables), +base Druid is less flexible than SQL-on-Hadoop solutions for generic processing. + +SQL-on-Hadoop engines support SQL-style queries with full joins. + +## Druid vs Parquet + +Parquet is a column storage format that is designed to work with SQL-on-Hadoop engines. Parquet doesn't have a query execution engine, and instead +relies on external sources to pull data out of it. + +Druid's storage format is highly optimized for linear scans. Although Druid has support for nested data, Parquet's storage format is much +more hierarchical, and is designed more for binary chunking. In theory, this should lead to faster scans in Druid. diff --git a/docs/35.0.0/configuration/extensions.md b/docs/35.0.0/configuration/extensions.md new file mode 100644 index 0000000000..ae8d5987d2 --- /dev/null +++ b/docs/35.0.0/configuration/extensions.md @@ -0,0 +1,178 @@ +--- +id: extensions +title: "Extensions" +--- + + + +Druid implements an extension system that allows for adding functionality at runtime. Extensions +are commonly used to add support for deep storages (like HDFS and S3), metadata stores (like MySQL +and PostgreSQL), new aggregators, new input formats, and so on. + +Production clusters will generally use at least two extensions: one for deep storage and one for a +metadata store. Many clusters will also use additional extensions. + +## Core extensions + +Core extensions are maintained by Druid committers. + +|Name|Description|Docs| +|----|-----------|----| +|druid-avro-extensions|Support for data in Apache Avro data format.|[link](../development/extensions-core/avro.md)| +|druid-azure-extensions|Microsoft Azure deep storage.|[link](../development/extensions-core/azure.md)| +|druid-basic-security|Support for Basic HTTP authentication and role-based access control.|[link](../development/extensions-core/druid-basic-security.md)| +|druid-bloom-filter|Support for providing Bloom filters in Druid queries.|[link](../development/extensions-core/bloom-filter.md)| +|druid-catalog|This extension allows users to configure, update, retrieve, and manage metadata stored in Druid's catalog. |[link](../development/extensions-core/catalog.md)| +|druid-datasketches|Support for approximate counts and set operations with [Apache DataSketches](https://datasketches.apache.org/).|[link](../development/extensions-core/datasketches-extension.md)| +|druid-google-extensions|Google Cloud Storage deep storage.|[link](../development/extensions-core/google.md)| +|druid-hdfs-storage|HDFS deep storage.|[link](../development/extensions-core/hdfs.md)| +|druid-histogram|Approximate histograms and quantiles aggregator.
Deprecated, please use the [DataSketches quantiles aggregator](../development/extensions-core/datasketches-quantiles.md) from the `druid-datasketches` extension instead.|[link](../development/extensions-core/approximate-histograms.md)| +|druid-kafka-extraction-namespace|Apache Kafka-based namespaced lookup. Requires namespace lookup extension.|[link](../querying/kafka-extraction-namespace.md)| +|druid-kafka-indexing-service|Supervised exactly-once Apache Kafka ingestion for the indexing service.|[link](../ingestion/kafka-ingestion.md)| +|druid-kinesis-indexing-service|Supervised exactly-once Kinesis ingestion for the indexing service.|[link](../ingestion/kinesis-ingestion.md)| +|druid-kerberos|Kerberos authentication for druid processes.|[link](../development/extensions-core/druid-kerberos.md)| +|druid-lookups-cached-global|A module for [lookups](../querying/lookups.md) providing a jvm-global eager caching for lookups. It provides JDBC and URI implementations for fetching lookup data.|[link](../querying/lookups-cached-global.md)| +|druid-lookups-cached-single| Per lookup caching module to support the use cases where a lookup need to be isolated from the global pool of lookups |[link](../development/extensions-core/druid-lookups.md)| +|druid-multi-stage-query| Support for the multi-stage query architecture for Apache Druid and the multi-stage query task engine.|[link](../multi-stage-query/index.md)| +|druid-orc-extensions|Support for data in Apache ORC data format.|[link](../development/extensions-core/orc.md)| +|druid-parquet-extensions|Support for data in Apache Parquet data format. Requires druid-avro-extensions to be loaded.|[link](../development/extensions-core/parquet.md)| +|druid-protobuf-extensions| Support for data in Protobuf data format.|[link](../development/extensions-core/protobuf.md)| +|druid-s3-extensions|Interfacing with data in Amazon S3, and using S3 as deep storage.|[link](../development/extensions-core/s3.md)| +|druid-ec2-extensions|Interfacing with AWS EC2 for autoscaling middle managers|UNDOCUMENTED| +|druid-aws-rds-extensions|Support for AWS token based access to AWS RDS DB Cluster.|[link](../development/extensions-core/druid-aws-rds.md)| +|druid-stats|Statistics related module including variance and standard deviation.|[link](../development/extensions-core/stats.md)| +|mysql-metadata-storage|MySQL metadata store.|[link](../development/extensions-core/mysql.md)| +|postgresql-metadata-storage|PostgreSQL metadata store.|[link](../development/extensions-core/postgresql.md)| +|simple-client-sslcontext|Simple SSLContext provider module to be used by Druid's internal HttpClient when talking to other Druid processes over HTTPS.|[link](../development/extensions-core/simple-client-sslcontext.md)| +|druid-pac4j|OpenID Connect authentication for druid processes.|[link](../development/extensions-core/druid-pac4j.md)| +|druid-kubernetes-extensions|Druid cluster deployment on Kubernetes without Zookeeper.|[link](../development/extensions-core/kubernetes.md)| +|druid-kubernetes-overlord-extensions|Support for launching tasks in k8s without Middle Managers|[link](../development/extensions-core/k8s-jobs.md)| + +## Community extensions + +:::info + Community extensions are not maintained by Druid committers, although we accept patches from community members using these extensions. They may not have been as extensively tested as the core extensions. +::: + +A number of community members have contributed their own extensions to Druid that are not packaged with the default Druid tarball. 
+If you'd like to take on maintenance for a community extension, please post on [dev@druid.apache.org](https://lists.apache.org/list.html?dev@druid.apache.org) to let us know! + +All of these community extensions can be downloaded using [pull-deps](../operations/pull-deps.md) while specifying a `-c` coordinate option to pull `org.apache.druid.extensions.contrib:{EXTENSION_NAME}:{DRUID_VERSION}`. + +|Name|Description|Docs| +|----|-----------|----| +|aliyun-oss-extensions|Aliyun OSS deep storage |[link](../development/extensions-contrib/aliyun-oss-extensions.md)| +|ambari-metrics-emitter|Ambari Metrics Emitter |[link](../development/extensions-contrib/ambari-metrics-emitter.md)| +|druid-cassandra-storage|Apache Cassandra deep storage.|[link](../development/extensions-contrib/cassandra.md)| +|druid-cloudfiles-extensions|Rackspace Cloudfiles deep storage.|[link](../development/extensions-contrib/cloudfiles.md)| +|druid-compressed-bigdecimal|Compressed Big Decimal Type | [link](../development/extensions-contrib/compressed-big-decimal.md)| +|druid-ddsketch|Support for DDSketch approximate quantiles based on [DDSketch](https://github.com/datadog/sketches-java) | [link](../development/extensions-contrib/ddsketch-quantiles.md)| +|druid-deltalake-extensions|Support for ingesting Delta Lake tables.|[link](../development/extensions-contrib/delta-lake.md)| +|druid-distinctcount|DistinctCount aggregator|[link](../development/extensions-contrib/distinctcount.md)| +|druid-exact-count-bitmap|Support for exact cardinality counting using Roaring Bitmap over a Long column.|[link](../development/extensions-contrib/druid-exact-count-bitmap.md)| +|druid-iceberg-extensions|Support for ingesting Iceberg tables.|[link](../development/extensions-contrib/iceberg.md)| +|druid-redis-cache|A cache implementation for Druid based on Redis.|[link](../development/extensions-contrib/redis-cache.md)| +|druid-time-min-max|Min/Max aggregator for timestamp.|[link](../development/extensions-contrib/time-min-max.md)| +|sqlserver-metadata-storage|Microsoft SQLServer metadata store.|[link](../development/extensions-contrib/sqlserver.md)| +|graphite-emitter|Graphite metrics emitter|[link](../development/extensions-contrib/graphite.md)| +|statsd-emitter|StatsD metrics emitter|[link](../development/extensions-contrib/statsd.md)| +|kafka-emitter|Kafka metrics emitter|[link](../development/extensions-contrib/kafka-emitter.md)| +|druid-thrift-extensions|Support thrift ingestion |[link](../development/extensions-contrib/thrift.md)| +|druid-opentsdb-emitter|OpenTSDB metrics emitter |[link](../development/extensions-contrib/opentsdb-emitter.md)| +|materialized-view-selection, materialized-view-maintenance|Materialized View|[link](../development/extensions-contrib/materialized-view.md)| +|druid-moving-average-query|Support for [Moving Average](https://en.wikipedia.org/wiki/Moving_average) and other Aggregate [Window Functions](https://en.wikibooks.org/wiki/Structured_Query_Language/Window_functions) in Druid queries.|[link](../development/extensions-contrib/moving-average-query.md)| +|druid-influxdb-emitter|InfluxDB metrics emitter|[link](../development/extensions-contrib/influxdb-emitter.md)| +|druid-momentsketch|Support for approximate quantile queries using the [momentsketch](https://github.com/stanford-futuredata/momentsketch) library|[link](../development/extensions-contrib/momentsketch-quantiles.md)| +|druid-tdigestsketch|Support for approximate sketch aggregators based on 
[T-Digest](https://github.com/tdunning/t-digest)|[link](../development/extensions-contrib/tdigestsketch-quantiles.md)| +|gce-extensions|GCE Extensions|[link](../development/extensions-contrib/gce-extensions.md)| +|prometheus-emitter|Exposes [Druid metrics](../operations/metrics.md) for [Prometheus](https://prometheus.io/)|[link](../development/extensions-contrib/prometheus.md)| +|druid-spectator-histogram|Support for efficient approximate percentile queries|[link](../development/extensions-contrib/spectator-histogram.md)| +|druid-rabbit-indexing-service|Support for creating and managing [RabbitMQ](https://www.rabbitmq.com/) indexing tasks|[link](../development/extensions-contrib/rabbit-stream-ingestion.md)| +|druid-ranger-security|Support for access control through Apache Ranger.|[link](../development/extensions-contrib/druid-ranger-security.md)| + +## Promoting community extensions to core extensions + +Please post on [dev@druid.apache.org](https://lists.apache.org/list.html?dev@druid.apache.org) if you'd like an extension to be promoted to core. +If we see a community extension actively supported by the community, we can promote it to core based on community feedback. + +For information how to create your own extension, please see [here](../development/modules.md). + +## Loading extensions + +### Loading core extensions + +Apache Druid bundles all [core extensions](../configuration/extensions.md#core-extensions) out of the box. +See the [list of extensions](../configuration/extensions.md#core-extensions) for your options. You +can load bundled extensions by adding their names to your common.runtime.properties +`druid.extensions.loadList` property. For example, to load the postgresql-metadata-storage and +druid-hdfs-storage extensions, use the configuration: + +```properties +druid.extensions.loadList=["postgresql-metadata-storage", "druid-hdfs-storage"] +``` + +These extensions are located in the `extensions` directory of the distribution. + +:::info + Druid bundles two sets of configurations: one for the [quickstart](../tutorials/index.md) and + one for a [clustered configuration](../tutorials/cluster.md). Make sure you are updating the correct + `common.runtime.properties` for your setup. +::: + +:::info + Because of licensing, the mysql-metadata-storage extension does not include the required MySQL JDBC driver. For instructions + on how to install this library, see the [MySQL extension page](../development/extensions-core/mysql.md). +::: + +### Loading community extensions + +You can also load community and third-party extensions not already bundled with Druid. To do this, first download the extension and +then install it into your `extensions` directory. You can download extensions from their distributors directly, or +if they are available from Maven, the included [pull-deps](../operations/pull-deps.md) can download them for you. To use *pull-deps*, +specify the full Maven coordinate of the extension in the form `groupId:artifactId:version`. For example, +for the (hypothetical) extension *com.example:druid-example-extension:1.0.0*, run: + +```shell +java \ + -cp "lib/*" \ + -Ddruid.extensions.directory="extensions" \ + -Ddruid.extensions.hadoopDependenciesDir="hadoop-dependencies" \ + org.apache.druid.cli.Main tools pull-deps \ + --no-default-hadoop \ + -c "com.example:druid-example-extension:1.0.0" +``` + +You only have to install the extension once. 
Then, add `"druid-example-extension"` to +`druid.extensions.loadList` in common.runtime.properties to instruct Druid to load the extension. + +:::info + Please make sure all the Extensions related configuration properties listed [here](../configuration/index.md#extensions) are set correctly. +::: + +:::info + The Maven `groupId` for almost every [community extension](../configuration/extensions.md#community-extensions) is `org.apache.druid.extensions.contrib`. The `artifactId` is the name + of the extension, and the version is the latest Druid stable version. +::: + +### Loading extensions from the classpath + +If you add your extension jar to the classpath at runtime, Druid will also load it into the system. This mechanism is relatively easy to reason about, +but it also means that you have to ensure that all dependency jars on the classpath are compatible. That is, Druid makes no provisions while using +this method to maintain class loader isolation so you must make sure that the jars on your classpath are mutually compatible. diff --git a/docs/35.0.0/configuration/human-readable-byte.md b/docs/35.0.0/configuration/human-readable-byte.md new file mode 100644 index 0000000000..0f412b69ab --- /dev/null +++ b/docs/35.0.0/configuration/human-readable-byte.md @@ -0,0 +1,98 @@ +--- +id: human-readable-byte +title: "Human-readable Byte Configuration Reference" +--- + + + + +This page documents configuration properties related to bytes. + +These properties can be configured through 2 ways: +1. a simple number in bytes +2. a number with a unit suffix + +## A number in bytes + +Given that cache size is 3G, there's a configuration as below + +```properties +# 3G bytes = 3_000_000_000 bytes +druid.cache.sizeInBytes=3000000000 +``` + + +## A number with a unit suffix + +When you have to put a large number for some configuration as above, it is easy to make a mistake such as extra or missing 0s. Druid supports a better way, a number with a unit suffix. + +Given a disk of 1T, the configuration can be + +```properties +druid.segmentCache.locations=[{"path":"/segment-cache-00","maxSize":"1t"},{"path":"/segment-cache-01","maxSize":"1200g"}] +``` + +Note: in above example, both `1t` and `1T` are acceptable since it's case-insensitive. +Also, only integers are valid as the number part. For example, you can't replace `1200g` with `1.2t`. + +### Supported Units +In the world of computer, a unit like `K` is ambiguous. It means 1000 or 1024 in different contexts, for more information please see [Here](https://en.wikipedia.org/wiki/Binary_prefix). + +To make it clear, the base of units are defined in Druid as below + +| Unit | Description | Base | +|---|---|---| +| K | Kilo Decimal Byte | 1_000 | +| M | Mega Decimal Byte | 1_000_000 | +| G | Giga Decimal Byte | 1_000_000_000 | +| T | Tera Decimal Byte | 1_000_000_000_000 | +| P | Peta Decimal Byte | 1_000_000_000_000_000 | +| Ki | Kilo Binary Byte | 1024 | +| Mi | Mega Binary Byte | 1024 * 1024 | +| Gi | Giga Binary Byte | 1024 * 1024 * 1024 | +| Ti | Tera Binary Byte | 1024 * 1024 * 1024 * 1024 | +| Pi | Peta Binary Byte | 1024 * 1024 * 1024 * 1024 * 1024 | +| KiB | Kilo Binary Byte | 1024 | +| MiB | Mega Binary Byte | 1024 * 1024 | +| GiB | Giga Binary Byte | 1024 * 1024 * 1024 | +| TiB | Tera Binary Byte | 1024 * 1024 * 1024 * 1024 | +| PiB | Peta Binary Byte | 1024 * 1024 * 1024 * 1024 * 1024 | + +Unit is case-insensitive. `k`, `kib`, `ki`, `KiB`, `Ki`, `kiB` are all acceptable. 
+ +Here are some examples + +```properties +# 1G bytes = 1_000_000_000 bytes +druid.cache.sizeInBytes=1g +``` + +```properties +# 256MiB bytes = 256 * 1024 * 1024 bytes +druid.cache.sizeInBytes=256MiB +``` + +```properties +# 256Mi = 256MiB = 256 * 1024 * 1024 bytes +druid.cache.sizeInBytes=256Mi +``` + + + diff --git a/docs/35.0.0/configuration/index.md b/docs/35.0.0/configuration/index.md new file mode 100644 index 0000000000..8aa5e81846 --- /dev/null +++ b/docs/35.0.0/configuration/index.md @@ -0,0 +1,2320 @@ +--- +id: index +title: "Configuration reference" +--- + + + +This page documents all of the configuration properties for each Druid service type. + +## Recommended configuration file organization + +A recommended way of organizing Druid configuration files can be seen in the `conf` directory in the Druid package root, shown below: + +```sh +$ ls -R conf +druid + +conf/druid: +_common broker coordinator historical middleManager overlord + +conf/druid/_common: +common.runtime.properties log4j2.xml + +conf/druid/broker: +jvm.config runtime.properties + +conf/druid/coordinator: +jvm.config runtime.properties + +conf/druid/historical: +jvm.config runtime.properties + +conf/druid/middleManager: +jvm.config runtime.properties + +conf/druid/overlord: +jvm.config runtime.properties +``` + +Each directory has a `runtime.properties` file containing configuration properties for the specific Druid service corresponding to the directory, such as `historical`. + +The `jvm.config` files contain JVM flags such as heap sizing properties for each service. + +Common properties shared by all services are placed in `_common/common.runtime.properties`. + +## Configuration interpolation + +Configuration values can be interpolated from System Properties, Environment Variables, or local files. Below is an example of how this can be used: + +```properties +druid.metadata.storage.type=${env:METADATA_STORAGE_TYPE} +druid.processing.tmpDir=${sys:java.io.tmpdir} +druid.segmentCache.locations=${file:UTF-8:/config/segment-cache-def.json} +``` + +Interpolation is also recursive so you can do: + +```properties +druid.segmentCache.locations=${file:UTF-8:${env:SEGMENT_DEF_LOCATION}} +``` + +If the property is not set, an exception will be thrown on startup, but a default can be provided if desired. Setting a default value will not work with file interpolation as an exception will be thrown if the file does not exist. + +```properties +druid.metadata.storage.type=${env:METADATA_STORAGE_TYPE:-mysql} +druid.processing.tmpDir=${sys:java.io.tmpdir:-/tmp} +``` + +If you need to set a variable that is wrapped by `${...}` but do not want it to be interpolated, you can escape it by adding another `$`. For example: + +```properties +config.name=$${value} +``` + +## Common configurations + +The properties under this section are common configurations that should be shared across all Druid services in a cluster. + +### JVM configuration best practices + +There are four JVM parameters that we set on all of our services: + +* `-Duser.timezone=UTC`: This sets the default timezone of the JVM to UTC. We always set this and do not test with other default timezones, so local timezones might work, but they also might uncover weird and interesting bugs. To issue queries in a non-UTC timezone, see [query granularities](../querying/granularities.md#period-granularities) +* `-Dfile.encoding=UTF-8` This is similar to timezone, we test assuming UTF-8. Local encodings might work, but they also might result in weird and interesting bugs. 
+* `-Djava.io.tmpdir=` Various parts of Druid use temporary files to interact with the file system. These files can become quite large. This means that systems that have small `/tmp` directories can cause problems for Druid. Therefore, set the JVM tmp directory to a location with ample space. + + Also consider the following when configuring the JVM tmp directory: + * The temp directory should not be volatile tmpfs. + * This directory should also have good read and write speed. + * Avoid NFS mount. + * The `org.apache.druid.java.util.metrics.SysMonitor` requires execute privileges on files in `java.io.tmpdir`. If you are using the system monitor, do not set `java.io.tmpdir` to `noexec`. +* `-Djava.util.logging.manager=org.apache.logging.log4j.jul.LogManager` This allows log4j2 to handle logs for non-log4j2 components (like jetty) which use standard java logging. + +### Extensions + +Many of Druid's external dependencies can be plugged in as modules. Extensions can be provided using the following configs: + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.extensions.directory`|The root extension directory where user can put extensions related files. Druid will load extensions stored under this directory.|`extensions` (This is a relative path to Druid's working directory)| +|`druid.extensions.hadoopDependenciesDir`|The root Hadoop dependencies directory where user can put Hadoop related dependencies files. Druid will load the dependencies based on the Hadoop coordinate specified in the Hadoop index task.|`hadoop-dependencies` (This is a relative path to Druid's working directory| +|`druid.extensions.loadList`|A JSON array of extensions to load from extension directories by Druid. If it is not specified, its value will be `null` and Druid will load all the extensions under `druid.extensions.directory`. If its value is empty list `[]`, then no extensions will be loaded at all. It is also allowed to specify absolute path of other custom extensions not stored in the common extensions directory.|null| +|`druid.extensions.searchCurrentClassloader`|This is a boolean flag that determines if Druid will search the main classloader for extensions. It defaults to true but can be turned off if you have reason to not automatically add all modules on the classpath.|true| +|`druid.extensions.useExtensionClassloaderFirst`|This is a boolean flag that determines if Druid extensions should prefer loading classes from their own jars rather than jars bundled with Druid. If false, extensions must be compatible with classes provided by any jars bundled with Druid. If true, extensions may depend on conflicting versions.|false| +|`druid.extensions.hadoopContainerDruidClasspath`|Hadoop Indexing launches Hadoop jobs and this configuration provides way to explicitly set the user classpath for the Hadoop job. By default, this is computed automatically by Druid based on the Druid service classpath and set of extensions. However, sometimes you might want to be explicit to resolve dependency conflicts between Druid and Hadoop.|null| +|`druid.extensions.addExtensionsToHadoopContainer`|Only applicable if `druid.extensions.hadoopContainerDruidClasspath` is provided. If set to true, then extensions specified in the loadList are added to Hadoop container classpath. 
Note that when `druid.extensions.hadoopContainerDruidClasspath` is not provided then extensions are always added to Hadoop container classpath.|false| + +### Modules + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.modules.excludeList`|A JSON array of canonical class names (e.g., `"org.apache.druid.somepackage.SomeModule"`) of module classes which shouldn't be loaded, even if they are found in extensions specified by `druid.extensions.loadList`, or in the list of core modules specified to be loaded on a particular Druid service type. Useful when some useful extension contains some module, which shouldn't be loaded on some Druid service type because some dependencies of that module couldn't be satisfied.|[]| + +### ZooKeeper + +We recommend just setting the base ZK path and the ZK service host, but all ZK paths that Druid uses can be overwritten to absolute paths. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.zk.paths.base`|Base ZooKeeper path.|`/druid`| +|`druid.zk.service.host`|The ZooKeeper hosts to connect to. This is a REQUIRED property and therefore a host address must be supplied.|none| +|`druid.zk.service.user`|The username to authenticate with ZooKeeper. This is an optional property.|none| +|`druid.zk.service.pwd`|The [Password Provider](../operations/password-provider.md) or the string password to authenticate with ZooKeeper. This is an optional property.|none| +|`druid.zk.service.authScheme`|digest is the only authentication scheme supported. |digest| + +#### ZooKeeper behavior + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.zk.service.sessionTimeoutMs`|ZooKeeper session timeout, in milliseconds.|`30000`| +|`druid.zk.service.connectionTimeoutMs`|ZooKeeper connection timeout, in milliseconds.|`15000`| +|`druid.zk.service.compress`|Boolean flag for whether or not created Znodes should be compressed.|`true`| +|`druid.zk.service.acl`|Boolean flag for whether or not to enable ACL security for ZooKeeper. If ACL is enabled, zNode creators will have all permissions.|`false`| +|`druid.zk.service.pathChildrenCacheStrategy`|Dictates the underlying caching strategy for service announcements. Set true to let announcers to use Apache Curator's PathChildrenCache strategy, otherwise NodeCache strategy. Consider using NodeCache strategy when you are dealing with huge number of ZooKeeper watches in your cluster.|`true`| + +#### Path configuration + +Druid interacts with ZooKeeper through a set of standard path configurations. We recommend just setting the base ZooKeeper path, but all ZooKeeper paths that Druid uses can be overwritten to absolute paths. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.zk.paths.base`|Base ZooKeeper path.|`/druid`| +|`druid.zk.paths.propertiesPath`|ZooKeeper properties path.|`${druid.zk.paths.base}/properties`| +|`druid.zk.paths.announcementsPath`|Druid service announcement path.|`${druid.zk.paths.base}/announcements`| +|`druid.zk.paths.liveSegmentsPath`|Current path for where Druid services announce their segments.|`${druid.zk.paths.base}/segments`| +|`druid.zk.paths.coordinatorPath`|Used by the Coordinator for leader election.|`${druid.zk.paths.base}/coordinator`| + +The indexing service also uses its own set of paths. These configs can be included in the common configuration. 
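For example, following the recommendation to set only the ZooKeeper host and base paths, a `common.runtime.properties` snippet might look like the following sketch (the ZooKeeper addresses are placeholders):

```properties
# ZooKeeper ensemble to connect to (placeholder hosts)
druid.zk.service.host=zk1.example.com:2181,zk2.example.com:2181
# Base path for Druid ZooKeeper nodes; other druid.zk.paths.* values default to children of this base
druid.zk.paths.base=/druid
# Base path for indexing-service nodes; defaults to ${druid.zk.paths.base}/indexer if unset
druid.zk.paths.indexer.base=/druid/indexer
```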

|Property|Description|Default|
|--------|-----------|-------|
|`druid.zk.paths.indexer.base`|Base ZooKeeper path for indexing service nodes.|`${druid.zk.paths.base}/indexer`|
|`druid.zk.paths.indexer.announcementsPath`|Middle Managers announce themselves here.|`${druid.zk.paths.indexer.base}/announcements`|
|`druid.zk.paths.indexer.tasksPath`|Used to assign tasks to Middle Managers.|`${druid.zk.paths.indexer.base}/tasks`|
|`druid.zk.paths.indexer.statusPath`|Parent path for announcement of task statuses.|`${druid.zk.paths.indexer.base}/status`|

If `druid.zk.paths.base` and `druid.zk.paths.indexer.base` are both set, and none of the other `druid.zk.paths.*` or `druid.zk.paths.indexer.*` values are set, then the other properties are evaluated relative to their respective `base`.
For example, if `druid.zk.paths.base` is set to `/druid1` and `druid.zk.paths.indexer.base` is set to `/druid2`, then `druid.zk.paths.announcementsPath` defaults to `/druid1/announcements` while `druid.zk.paths.indexer.announcementsPath` defaults to `/druid2/announcements`.

The following path is used for service discovery. It is **not** affected by `druid.zk.paths.base` and **must** be specified separately.

|Property|Description|Default|
|--------|-----------|-------|
|`druid.discovery.curator.path`|Services announce themselves under this ZooKeeper path.|`/druid/discovery`|

### TLS

#### General configuration

|Property|Description|Default|
|--------|-----------|-------|
|`druid.enablePlaintextPort`|Enable/Disable HTTP connector.|`true`|
|`druid.enableTlsPort`|Enable/Disable HTTPS connector.|`false`|

Although it is not recommended, you can enable both the HTTP and HTTPS connectors at the same time. The respective ports are configurable using the `druid.plaintextPort`
and `druid.tlsPort` properties on each service. See the `Configuration` section of individual services for the valid and default values of these ports.

#### Jetty server TLS configuration

Druid uses Jetty as an embedded web server. To learn more about TLS/SSL, certificates, and related concepts in Jetty, including explanations of the configuration settings below, see "Configuring SSL/TLS KeyStores" in the [Jetty Operations Guide](https://www.eclipse.org/jetty/documentation.php).

For information about TLS/SSL support in Java in general, see the [Java Secure Socket Extension (JSSE) Reference Guide](https://docs.oracle.com/en/java/javase/17/security/java-secure-socket-extension-jsse-reference-guide.html).
The [Java Cryptography Architecture Standard Algorithm Name Documentation for JDK 17](https://docs.oracle.com/en/java/javase/17/docs/specs/security/standard-names.html) lists all possible
values for the following properties, among others provided by the Java implementation.

|Property|Description|Default|Required|
|--------|-----------|-------|--------|
|`druid.server.https.keyStorePath`|The file path or URL of the TLS/SSL KeyStore.|none|yes|
|`druid.server.https.keyStoreType`|The type of the KeyStore.|none|yes|
|`druid.server.https.certAlias`|Alias of TLS/SSL certificate for the connector.|none|yes|
|`druid.server.https.keyStorePassword`|The [Password Provider](../operations/password-provider.md) or String password for the KeyStore.|none|yes|

The following table contains optional advanced configuration options. Use them with caution.
+ +|Property|Description|Default|Required| +|--------|-----------|-------|--------| +|`druid.server.https.keyManagerFactoryAlgorithm`|Algorithm to use for creating KeyManager, more details [here](https://docs.oracle.com/javase/7/docs/technotes/guides/security/jsse/JSSERefGuide.html#KeyManager).|`javax.net.ssl.KeyManagerFactory.getDefaultAlgorithm()`|no| +|`druid.server.https.keyManagerPassword`|The [Password Provider](../operations/password-provider.md) or String password for the Key Manager.|none|no| +|`druid.server.https.includeCipherSuites`|List of cipher suite names to include. You can either use the exact cipher suite name or a regular expression.|Jetty's default include cipher list|no| +|`druid.server.https.excludeCipherSuites`|List of cipher suite names to exclude. You can either use the exact cipher suite name or a regular expression.|Jetty's default exclude cipher list|no| +|`druid.server.https.includeProtocols`|List of exact protocols names to include.|Jetty's default include protocol list|no| +|`druid.server.https.excludeProtocols`|List of exact protocols names to exclude.|Jetty's default exclude protocol list|no| + +#### Internal client TLS configuration (requires `simple-client-sslcontext` extension) + +These properties apply to the SSLContext that will be provided to the internal HTTP client that Druid services use to communicate with each other. These properties require the `simple-client-sslcontext` extension to be loaded. Without it, Druid services will be unable to communicate with each other when TLS is enabled. + +|Property|Description|Default|Required| +|--------|-----------|-------|--------| +|`druid.client.https.protocol`|SSL protocol to use.|`TLSv1.2`|no| +|`druid.client.https.trustStoreType`|The type of the key store where trusted root certificates are stored.|`java.security.KeyStore.getDefaultType()`|no| +|`druid.client.https.trustStorePath`|The file path or URL of the TLS/SSL Key store where trusted root certificates are stored.|none|yes| +|`druid.client.https.trustStoreAlgorithm`|Algorithm to be used by TrustManager to validate certificate chains|`javax.net.ssl.TrustManagerFactory.getDefaultAlgorithm()`|no| +|`druid.client.https.trustStorePassword`|The [Password Provider](../operations/password-provider.md) or String password for the Trust Store.|none|yes| + +This [document](https://docs.oracle.com/en/java/javase/17/docs/specs/security/standard-names.html) lists all the possible +values for the above mentioned configs among others provided by Java implementation. + +### Authentication and authorization + +|Property|Type|Description|Default|Required| +|--------|-----------|--------|--------|--------| +|`druid.auth.authenticatorChain`|JSON List of Strings|List of Authenticator type names|["allowAll"]|no| +|`druid.escalator.type`|String|Type of the Escalator that should be used for internal Druid communications. This Escalator must use an authentication scheme that is supported by an Authenticator in `druid.auth.authenticatorChain`.|`noop`|no| +|`druid.auth.authorizers`|JSON List of Strings|List of Authorizer type names |["allowAll"]|no| +|`druid.auth.unsecuredPaths`| List of Strings|List of paths for which security checks will not be performed. All requests to these paths will be allowed.|[]|no| +|`druid.auth.allowUnauthenticatedHttpOptions`|Boolean|If true, skip authentication checks for HTTP OPTIONS requests. This is needed for certain use cases, such as supporting CORS pre-flight requests. 
Note that disabling authentication checks for OPTIONS requests will allow unauthenticated users to determine what Druid endpoints are valid (by checking if the OPTIONS request returns a 200 instead of 404), so enabling this option may reveal information about server configuration, including information about what extensions are loaded (if those extensions add endpoints).|false|no| + +For more information, please see [Authentication and Authorization](../operations/auth.md). + +For configuration options for specific auth extensions, please refer to the extension documentation. + +### Startup logging + +All services can log debugging information on startup. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.startup.logging.logProperties`|Log all properties on startup (from common.runtime.properties, runtime.properties, and the JVM command line).|false| +|`druid.startup.logging.maskProperties`|Masks sensitive properties (passwords, for example) containing theses words.|["password"]| + +Note that some sensitive information may be logged if these settings are enabled. + +### Request logging + +All services that can serve queries can also log the query requests they see. Broker services can additionally log the SQL requests (both from HTTP and JDBC) they see. +For an example of setting up request logging, see [Request logging](../operations/request-logging.md). + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.request.logging.type`|How to log every query request. Choices: `noop`, [`file`](#file-request-logging), [`emitter`](#emitter-request-logging), [`slf4j`](#slf4j-request-logging), [`filtered`](#filtered-request-logging), [`composing`](#composing-request-logging), [`switching`](#switching-request-logging)|`noop` (request logging disabled by default)| + +To enable sending all the HTTP requests to a log, set `org.apache.druid.jetty.RequestLog` to the `DEBUG` level. See [Logging](../configuration/logging.md) for more information. + +#### File request logging + +The `file` request logger stores daily request logs on disk. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.request.logging.dir`| Historical, Realtime, and Broker services maintain request logs of all of the requests they get (interaction is via POST, so normal request logs don’t generally capture information about the actual query), this specifies the directory to store the request logs in. | none| +|`druid.request.logging.filePattern`| [Joda datetime format](http://www.joda.org/joda-time/apidocs/org/joda/time/format/DateTimeFormat.html) for each file.| "yyyy-MM-dd'.log'"| +|`druid.request.logging.durationToRetain`| Period to retain the request logs on disk. The period should be at least as long as roll period.| none| +|`druid.request.logging.rollPeriod`| Defines the log rotation period for request logs. The period should be at least `PT1H`. For periods smaller than 1 day, it is recommended to use `"yyyy-MM-dd-HH'.log'"` as the file pattern.| P1D| + +The format of request logs is TSV, one line per requests, with five fields: timestamp, remote\_addr, native\_query, query\_context, sql\_query. + +For native JSON request, the `sql_query` field is empty. 
For example: + +```txt +2019-01-14T10:00:00.000Z 127.0.0.1 {"queryType":"topN","dataSource":{"type":"table","name":"wikiticker"},"virtualColumns":[],"dimension":{"type":"LegacyDimensionSpec","dimension":"page","outputName":"page","outputType":"STRING"},"metric":{"type":"LegacyTopNMetricSpec","metric":"count"},"threshold":10,"intervals":{"type":"LegacySegmentSpec","intervals":["2015-09-12T00:00:00.000Z/2015-09-13T00:00:00.000Z"]},"filter":null,"granularity":{"type":"all"},"aggregations":[{"type":"count","name":"count"}],"postAggregations":[],"context":{"queryId":"74c2d540-d700-4ebd-b4a9-3d02397976aa"},"descending":false} {"query/time":100,"query/bytes":800,"success":true,"identity":"user1"} +``` + +For SQL query request, the `native_query` field is empty. For example: + +```txt +2019-01-14T10:00:00.000Z 127.0.0.1 {"sqlQuery/time":100, "sqlQuery/planningTimeMs":10, "sqlQuery/bytes":600, "success":true, "identity":"user1"} {"query":"SELECT page, COUNT(*) AS Edits FROM wikiticker WHERE TIME_IN_INTERVAL(\"__time\", '2015-09-12/2015-09-13') GROUP BY page ORDER BY Edits DESC LIMIT 10","context":{"sqlQueryId":"c9d035a0-5ffd-4a79-a865-3ffdadbb5fdd","nativeQueryIds":"[490978e4-f5c7-4cf6-b174-346e63cf8863]"}} +``` + +#### Emitter request logging + +The `emitter` request logger emits every request to the external location specified in the [emitter](#metrics-monitors) configuration. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.request.logging.feed`|Feed name for requests.|none| + +#### SLF4J request logging + +The `slf4j` request logger logs every request using SLF4J. It serializes native queries into JSON in the log message regardless of the SLF4J format specification. Requests are logged under the class `org.apache.druid.server.log.LoggingRequestLogger`. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.request.logging.setMDC`|If you want to set MDC entries within the log entry, set this value to `true`. Your logging system must be configured to support MDC in order to format this data.|false| +|`druid.request.logging.setContextMDC`|Set to "true" to add the Druid query `context` to the MDC entries. Only applies when `setMDC` is `true`.|false| + +For a native query, the following MDC fields are populated when `setMDC` is `true`: + +|MDC field|Description| +|---------|-----------| +|`queryId` |The query ID| +|`sqlQueryId`|The SQL query ID if this query is part of a SQL request| +|`dataSource`|The datasource the query was against| +|`queryType` |The type of the query| +|`hasFilters`|If the query has any filters| +|`remoteAddr`|The remote address of the requesting client| +|`duration` |The duration of the query interval| +|`resultOrdering`|The ordering of results| +|`descending`|If the query is a descending query| + +#### Filtered request logging + +The `filtered` request logger filters requests based on the query type or how long a query takes to complete. +For native queries, the logger only logs requests when the `query/time` metric exceeds the threshold provided in `queryTimeThresholdMs`. +For SQL queries, it only logs requests when the `sqlQuery/time` metric exceeds threshold provided in `sqlQueryTimeThresholdMs`. +See [Metrics](../operations/metrics.md) for more details on query metrics. + +Requests that meet the threshold are logged using the request logger type set in `druid.request.logging.delegate.type`. 
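For example, a minimal sketch of a filtered request logger in `runtime.properties` might look like the following, which logs only native queries slower than 5 seconds and SQL queries slower than 10 seconds, and delegates the actual logging to the `slf4j` request logger:

```properties
druid.request.logging.type=filtered
# Log native queries only when the query/time metric exceeds 5000 ms
druid.request.logging.queryTimeThresholdMs=5000
# Log SQL queries only when the sqlQuery/time metric exceeds 10000 ms
druid.request.logging.sqlQueryTimeThresholdMs=10000
# Delegate request logger that writes the requests that pass the filter
druid.request.logging.delegate.type=slf4j
```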
+ +|Property|Description|Default| +|--------|-----------|-------| +|`druid.request.logging.queryTimeThresholdMs`|Threshold value for the `query/time` metric in milliseconds.|0, i.e., no filtering| +|`druid.request.logging.sqlQueryTimeThresholdMs`|Threshold value for the `sqlQuery/time` metric in milliseconds.|0, i.e., no filtering| +|`druid.request.logging.mutedQueryTypes` | Query requests of these types are not logged. Query types are defined as string objects corresponding to the "queryType" value for the specified query in the Druid's [native JSON query API](../querying/querying.md). Misspelled query types will be ignored. Example to ignore scan and timeBoundary queries: `["scan", "timeBoundary"]`| []| +|`druid.request.logging.delegate.type`|Type of delegate request logger to log requests.|none| + +#### Composing request logging + +The `composing` request logger emits request logs to multiple request loggers. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.request.logging.loggerProviders`|List of request loggers for emitting request logs.|none| + +#### Switching request logging + +The `switching` request logger routes native query request logs to one request logger and SQL query request logs to another request logger. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.request.logging.nativeQueryLogger`|Request logger for emitting native query request logs.|none| +|`druid.request.logging.sqlQueryLogger`|Request logger for emitting SQL query request logs.|none| + +### Audit logging + +Coordinator and Overlord log changes to lookups, segment load/drop rules, and dynamic configuration changes for auditing. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.audit.manager.type`|Type of audit manager used for handling audited events. Audited events are logged when set to `log` or persisted in metadata store when set to `sql`.|sql| +|`druid.audit.manager.logLevel`|Log level of audit events with possible values DEBUG, INFO, WARN. This property is used only when `druid.audit.manager.type` is set to `log`.|INFO| +|`druid.audit.manager.auditHistoryMillis`|Default duration for querying audit history.|1 week| +|`druid.audit.manager.includePayloadAsDimensionInMetric`|Boolean flag on whether to add `payload` column in service metric.|false| +|`druid.audit.manager.maxPayloadSizeBytes`|The maximum size of audit payload to store in Druid's metadata store audit table. If the size of audit payload exceeds this value, the audit log would be stored with a message indicating that the payload was omitted instead. Setting `maxPayloadSizeBytes` to -1 (default value) disables this check, meaning Druid will always store audit payload regardless of it's size. Setting to any negative number other than `-1` is invalid. Human-readable format is supported, see [here](human-readable-byte.md). |-1| +|`druid.audit.manager.skipNullField`|If true, the audit payload stored in metadata store will exclude any field with null value. |false| + +### Metadata storage + +These properties specify the JDBC connection and other configuration around the metadata storage. The only services that connect to the metadata storage with these properties are the [Coordinator](../design/coordinator.md) and [Overlord](../design/overlord.md). + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.metadata.storage.type`|The type of metadata storage to use. 
One of `mysql`, `postgresql`, or `derby`.|`derby`| +|`druid.metadata.storage.connector.connectURI`|The JDBC URI for the database to connect to|none| +|`druid.metadata.storage.connector.user`|The username to connect with.|none| +|`druid.metadata.storage.connector.password`|The [Password Provider](../operations/password-provider.md) or String password used to connect with.|none| +|`druid.metadata.storage.connector.createTables`|If Druid requires a table and it doesn't exist, create it?|true| +|`druid.metadata.storage.tables.base`|The base name for tables.|`druid`| +|`druid.metadata.storage.tables.dataSource`|The table to use to look for datasources created by [Kafka Indexing Service](../ingestion/kafka-ingestion.md).|`druid_dataSource`| +|`druid.metadata.storage.tables.pendingSegments`|The table to use to look for pending segments.|`druid_pendingSegments`| +|`druid.metadata.storage.tables.segments`|The table to use to look for segments.|`druid_segments`| +|`druid.metadata.storage.tables.rules`|The table to use to look for segment load/drop rules.|`druid_rules`| +|`druid.metadata.storage.tables.config`|The table to use to look for configs.|`druid_config`| +|`druid.metadata.storage.tables.tasks`|Used by the indexing service to store tasks.|`druid_tasks`| +|`druid.metadata.storage.tables.taskLog`|Used by the indexing service to store task logs.|`druid_tasklogs`| +|`druid.metadata.storage.tables.taskLock`|Used by the indexing service to store task locks.|`druid_tasklocks`| +|`druid.metadata.storage.tables.supervisors`|Used by the indexing service to store supervisor configurations.|`druid_supervisors`| +|`druid.metadata.storage.tables.audit`|The table to use for audit history of configuration changes, such as Coordinator rules.|`druid_audit`| +|`druid.metadata.storage.tables.useShortIndexNames`|Whether to use SHA-based unique index names to ensure all indices are created.|`false`| + +### Deep storage + +The configurations concern how to push and pull [Segments](../design/segments.md) from deep storage. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.storage.type`|The type of deep storage to use. One of `local`, `noop`, `s3`, `hdfs`, `c*`.|local| + +#### Local deep storage + +Local deep storage uses the local filesystem. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.storage.storageDirectory`|Directory on disk to use as deep storage.|`/tmp/druid/localStorage`| + +#### Noop deep storage + +This deep storage doesn't do anything. There are no configs. + +#### S3 deep storage + +This deep storage is used to interface with Amazon's S3. Note that the `druid-s3-extensions` extension must be loaded. +The below table shows some important configurations for S3. See [S3 Deep Storage](../development/extensions-core/s3.md) for full configurations. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.storage.bucket`|S3 bucket name.|none| +|`druid.storage.baseKey`|S3 object key prefix for storage.|none| +|`druid.storage.disableAcl`|Boolean flag for ACL. If this is set to `false`, the full control would be granted to the bucket owner. This may require to set additional permissions. See [S3 permissions settings](../development/extensions-core/s3.md#s3-permissions-settings).|false| +|`druid.storage.archiveBucket`|S3 bucket name for archiving when running the _archive task_.|none| +|`druid.storage.archiveBaseKey`|S3 object key prefix for archiving.|none| +|`druid.storage.sse.type`|Server-side encryption type. 
Should be one of `s3`, `kms`, and `custom`. See the below [Server-side encryption section](../development/extensions-core/s3.md#server-side-encryption) for more details.|None| +|`druid.storage.sse.kms.keyId`|AWS KMS key ID. This is used only when `druid.storage.sse.type` is `kms` and can be empty to use the default key ID.|None| +|`druid.storage.sse.custom.base64EncodedKey`|Base64-encoded key. Should be specified if `druid.storage.sse.type` is `custom`.|None| +|`druid.storage.useS3aSchema`|If true, use the "s3a" filesystem when using Hadoop-based ingestion. If false, the "s3n" filesystem will be used. Only affects Hadoop-based ingestion.|false| + +#### HDFS deep storage + +This deep storage is used to interface with HDFS. You must load the `druid-hdfs-storage` extension. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.storage.storageDirectory`|HDFS directory to use as deep storage.|none| + +#### Cassandra deep storage + +This deep storage is used to interface with Cassandra. You must load the `druid-cassandra-storage` extension. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.storage.host`|Cassandra host.|none| +|`druid.storage.keyspace`|Cassandra key space.|none| + +#### Centralized datasource schema (Experimental) + +This is an [experimental feature](../development/experimental.md) to improve datasource schema management by persisting segment schemas to the metadata store and caching them on the Coordinator. +Traditionally, Brokers issue segment metadata queries to data nodes and tasks to fetch the schemas of all available segments. +Each Broker then individually builds the schema of a datasource by combining the schemas of all the segments of that datasource. +This mechanism is redundant and prone to errors as there is no single source of truth for schemas. + +Centralized schema management improves upon this design as follows: +- Tasks publish segment schema along with segment metadata to the database. +- Tasks announce schema for realtime segments periodically to the Coordinator. +- Coordinator caches segment schemas and builds a combined schema for each datasource. +- Broker poll the datasource schema cached on the Coordinator rather than building it on their own. +- Brokers still retain the ability to build a datasource schema if they are unable to fetch it from the Coordinator. + +|Property|Description|Default|Required| +|--------|-----------|-------|--------| +|`druid.centralizedDatasourceSchema.enabled`|Boolean flag for enabling datasource schema building and caching on the Coordinator. This property should be specified in the common runtime properties.|false|No.| +|`druid.indexer.fork.property.druid.centralizedDatasourceSchema.enabled`| This config should be set when CentralizedDatasourceSchema feature is enabled. This should be specified in the Middle Manager runtime properties.|false|No.| + +If you enable this feature, you can query datasources that are only stored in deep storage and are not loaded on a Historical. For more information, see [Query from deep storage](../querying/query-from-deep-storage.md). + +For stale schema cleanup configs, refer to properties with the prefix `druid.coordinator.kill.segmentSchema` in [Metadata Management](#metadata-management). + +### Ingestion security configuration + +#### HDFS input source + +You can set the following property to specify permissible protocols for +the [HDFS input source](../ingestion/input-sources.md#hdfs-input-source). 
+ +|Property|Possible values|Description|Default| +|--------|---------------|-----------|-------| +|`druid.ingestion.hdfs.allowedProtocols`|List of protocols|Allowed protocols for the HDFS input source.|`["hdfs"]`| + +#### HTTP input source + +You can set the following property to specify permissible protocols for +the [HTTP input source](../ingestion/input-sources.md#http-input-source). + +|Property| Possible values | Description |Default| +|--------|------------------------------------------------------------------------------------------------------------------------------------------------------------------|-------------------------------------------------------------------------------------------------------------------------------------------|-------| +|`druid.ingestion.http.allowedProtocols`| List of protocols | Allowed protocols for the HTTP input source. |`["http", "https"]`| +|`druid.ingestion.http.allowedHeaders`| A list of permitted request headers for the HTTP input source. By default, the list is empty, which means no headers are allowed in the ingestion specification. |`[]`| + +### External data access security configuration + +#### JDBC connections to external databases + +You can use the following properties to specify permissible JDBC options for: + +* [SQL input source](../ingestion/input-sources.md#sql-input-source) +* [globally cached JDBC lookups](../querying/lookups-cached-global.md#jdbc-lookup) +* [JDBC Data Fetcher for per-lookup caching](../development/extensions-core/druid-lookups.md#data-fetcher-layer). + +These properties do not apply to metadata storage connections. + +|Property|Possible values| Description |Default| +|--------|---------------|--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|-------| +|`druid.access.jdbc.enforceAllowedProperties`|Boolean| When true, Druid applies `druid.access.jdbc.allowedProperties` to JDBC connections starting with `jdbc:postgresql:`, `jdbc:mysql:`, or `jdbc:mariadb:`. When false, Druid allows any kind of JDBC connections without JDBC property validation. This config is for backward compatibility especially during upgrades since enforcing allow list can break existing ingestion jobs or lookups based on JDBC. This config is deprecated and will be removed in a future release. |true| +|`druid.access.jdbc.allowedProperties`|List of JDBC properties| Defines a list of allowed JDBC properties. Druid always enforces the list for all JDBC connections starting with `jdbc:postgresql:`, `jdbc:mysql:`, and `jdbc:mariadb:` if `druid.access.jdbc.enforceAllowedProperties` is set to true.

This option is tested against MySQL connector 8.2.0, MariaDB connector 2.7.4, and PostgreSQL connector 42.2.14. Other connector versions might not work. |`["useSSL", "requireSSL", "ssl", "sslmode"]`| +|`druid.access.jdbc.allowUnknownJdbcUrlFormat`|Boolean| When false, Druid only accepts JDBC connections starting with `jdbc:postgresql:` or `jdbc:mysql:`. When true, Druid allows JDBC connections to any kind of database, but only enforces `druid.access.jdbc.allowedProperties` for PostgreSQL and MySQL/MariaDB. |true| + +### Task logging + +You can use the `druid.indexer` configuration to set a [long-term storage](#log-long-term-storage) location for task log files, and to set a [retention policy](#log-retention-policy). + +For more information about ingestion tasks and the services of generating logs, see the [task reference](../ingestion/tasks.md). + +#### Log long-term storage + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexer.logs.type`|Where to store task logs. `noop`, [`s3`](#s3-task-logs), [`azure`](#azure-blob-store-task-logs), [`google`](#google-cloud-storage-task-logs), [`hdfs`](#hdfs-task-logs), [`file`](#file-task-logs) |`file`| + +##### File task logs + +Store task logs in the local filesystem. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexer.logs.directory`|Local filesystem path.|log| + +##### S3 task logs + +Store task logs in S3. Note that the `druid-s3-extensions` extension must be loaded. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexer.logs.s3Bucket`|S3 bucket name.|none| +|`druid.indexer.logs.s3Prefix`|S3 key prefix.|none| +|`druid.indexer.logs.disableAcl`|Boolean flag for ACL. If this is set to `false`, the full control would be granted to the bucket owner. If the task logs bucket is the same as the deep storage (S3) bucket, then the value of this property will need to be set to true if druid.storage.disableAcl has been set to true.|false| + +##### Azure Blob Store task logs + +Store task logs in Azure Blob Store. To enable this feature, load the `druid-azure-extensions` extension, and configure deep storage for Azure. Druid uses the same authentication method configured for deep storage and stores task logs in the same storage account (set in `druid.azure.account`). + +| Property | Description | Default | +|---|---|---| +| `druid.indexer.logs.container` | The Azure Blob Store container to write logs to. | Must be set. | +| `druid.indexer.logs.prefix` | The path to prepend to logs. | Must be set. | + +##### Google Cloud Storage task logs + +Store task logs in Google Cloud Storage. + +Note: The `druid-google-extensions` extension must be loaded, and this uses the same storage settings as the deep storage module for google. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexer.logs.bucket`|The Google Cloud Storage bucket to write logs to|none| +|`druid.indexer.logs.prefix`|The path to prepend to logs|none| + +##### HDFS task logs + +Store task logs in HDFS. Note that the `druid-hdfs-storage` extension must be loaded. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexer.logs.directory`|The directory to store logs.|none| + +#### Log retention policy + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexer.logs.kill.enabled`|Boolean value for whether to enable deletion of old task logs. 
If set to true, the Overlord periodically submits kill tasks at the interval set by `druid.indexer.logs.kill.delay`. These tasks delete task logs from the log directory, as well as the corresponding entries in the tasks and task logs tables in metadata storage, except for tasks created in the last `druid.indexer.logs.kill.durationToRetain` period. |false|
|`druid.indexer.logs.kill.durationToRetain`| Required if kill is enabled. Duration, in milliseconds, for which task logs and task-related metadata entries are retained. Logs and entries created within the last `durationToRetain` milliseconds are not deleted. |None|
|`druid.indexer.logs.kill.initialDelay`| Optional. Number of milliseconds after Overlord startup before the first automatic kill run. |random value less than 300000 (5 mins)|
|`druid.indexer.logs.kill.delay`|Optional. Number of milliseconds between successive automatic kill runs. |21600000 (6 hours)|

### API error response

You can configure Druid API error responses to hide internal information such as the Druid class name, stack trace, thread name, servlet name, code, line/column number, host, or IP address.

|Property|Description|Default|
|--------|-----------|-------|
|`druid.server.http.showDetailedJettyErrors`|When set to true, any error from the Jetty layer / Jetty filter includes the following fields in the JSON response: `servlet`, `message`, `url`, `status`, and `cause`, if it exists. When set to false, the JSON response only includes `message`, `url`, and `status`. The field values remain unchanged.|true|
|`druid.server.http.errorResponseTransform.strategy`|Error response transform strategy. The strategy controls how Druid transforms error responses from Druid services. When unset or set to `none`, Druid leaves error responses unchanged.|`none`|

#### Error response transform strategy

You can use an error response transform strategy to transform error responses from within Druid services to hide internal information.
When you specify an error response transform strategy other than `none`, Druid transforms the error responses from Druid services as follows:

* For any query API that fails in the Router service, Druid sets the fields `errorClass` and `host` to null. Druid applies the transformation strategy to the `errorMessage` field.
* For any SQL query API that fails, for example `POST /druid/v2/sql/...`, Druid sets the fields `errorClass` and `host` to null. Druid applies the transformation strategy to the `errorMessage` field.
* For any JDBC-related exceptions, Druid turns all checked exceptions into `QueryInterruptedException`; otherwise, Druid attempts to keep the original exception type. For example, if the original exception isn't owned by Druid, it becomes `QueryInterruptedException`. Druid applies the transformation strategy to the `errorMessage` field.

##### No error response transform strategy

In this mode, Druid leaves error responses from underlying services unchanged and returns the unchanged errors to the API client.
This is the default Druid error response mode. To explicitly enable this strategy, set `druid.server.http.errorResponseTransform.strategy` to `none`.

##### Allowed regular expression error response transform strategy

In this mode, Druid validates the error responses from underlying services against a list of regular expressions. Only error messages that match a configured regular expression are returned. To enable this strategy, set `druid.server.http.errorResponseTransform.strategy` to `allowedRegex`.
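As a minimal configuration sketch, the following snippet enables the strategy; the regular expression here matches the Calcite validation errors used in the examples below:

```properties
druid.server.http.errorResponseTransform.strategy=allowedRegex
# Only error messages matching these regular expressions are returned unchanged
druid.server.http.errorResponseTransform.allowedRegex=[".*CalciteContextException.*"]
```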
+ +|Property|Description|Default| +|--------|-----------|-------| +|`druid.server.http.errorResponseTransform.allowedRegex`|The list of regular expressions Druid uses to validate error messages. If the error message matches any of the regular expressions, then Druid includes it in the response unchanged. If the error message does not match any of the regular expressions, Druid replaces the error message with null or with a default message depending on the type of underlying Exception. |`[]`| + +For example, consider the following error response: + +```json +{"error":"Plan validation failed","errorMessage":"org.apache.calcite.runtime.CalciteContextException: From line 1, column 15 to line 1, column 38: Object 'nonexistent-datasource' not found","errorClass":"org.apache.calcite.tools.ValidationException","host":null} +``` + +If `druid.server.http.errorResponseTransform.allowedRegex` is set to `[]`, Druid transforms the query error response to the following: + +```json +{"error":"Plan validation failed","errorMessage":null,"errorClass":null,"host":null} +``` + +On the other hand, if `druid.server.http.errorResponseTransform.allowedRegex` is set to `[".*CalciteContextException.*"]` then Druid transforms the query error response to the following: + +```json +{"error":"Plan validation failed","errorMessage":"org.apache.calcite.runtime.CalciteContextException: From line 1, column 15 to line 1, column 38: Object 'nonexistent-datasource' not found","errorClass":null,"host":null} +``` + +##### Persona based error response transform strategy + +In this mode, Druid transforms any exceptions which are targeted at non-users personas. Instead of returning such exception directly, the strategy logs the exception against a random id and returns the id along with a generic error message to the user. + +To enable this strategy, set `druid.server.http.errorResponseTransform.strategy` to `persona`. + +### Overlord discovery + +This config is used to find the [Overlord](../design/overlord.md) using Curator service discovery. Only required if you are actually running an Overlord. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.selectors.indexing.serviceName`|The druid.service name of the Overlord service. To start the Overlord with a different name, set it with this property. |druid/overlord| + +### Coordinator discovery + +This config is used to find the [Coordinator](../design/coordinator.md) using Curator service discovery. This config is used by the realtime indexing services to get information about the segments loaded in the cluster. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.selectors.coordinator.serviceName`|The druid.service name of the Coordinator service. To start the Coordinator with a different name, set it with this property. |druid/coordinator| + +### Announcing segments + +You can configure how to announce and unannounce Znodes in ZooKeeper (using Curator). For normal operations you do not need to override any of these configs. + +#### Batch data segment announcer + +In current Druid, multiple data segments may be announced under the same Znode. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.announcer.segmentsPerNode`|Each Znode contains info for up to this many segments.|50| +|`druid.announcer.maxBytesPerNode`|Max byte size for Znode. Allowed range is [1024, 1048576].|524288| +|`druid.announcer.skipDimensionsAndMetrics`|Skip Dimensions and Metrics list from segment announcements. 
NOTE: Enabling this will also remove the dimensions and metrics list from Coordinator and Broker endpoints.|false| +|`druid.announcer.skipLoadSpec`|Skip segment LoadSpec from segment announcements. NOTE: Enabling this will also remove the loadspec from Coordinator and Broker endpoints.|false| + +If you want to turn off the batch data segment announcer, you can add a property to skip announcing segments. **You do not want to enable this config if you have any services using `batch` for `druid.serverview.type`** + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.announcer.skipSegmentAnnouncementOnZk`|Skip announcing segments to ZooKeeper. Note that the batch server view will not work if this is set to true.|false| + +### JavaScript + +Druid supports dynamic runtime extension through JavaScript functions. This functionality can be configured through +the following properties. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.javascript.enabled`|Set to "true" to enable JavaScript functionality. This affects the JavaScript parser, filter, extractionFn, aggregator, post-aggregator, router strategy, and worker selection strategy.|false| + +:::info + JavaScript-based functionality is disabled by default. Please refer to the Druid [JavaScript programming guide](../development/javascript.md) for guidelines about using Druid's JavaScript functionality, including instructions on how to enable it. +::: + +### Double column storage + +Prior to version 0.13.0, Druid's storage layer used a 32-bit float representation to store columns created by the +doubleSum, doubleMin, and doubleMax aggregators at indexing time. +Starting from version 0.13.0 the default will be 64-bit floats for Double columns. +Using 64-bit representation for double column will lead to avoid precision loss at the cost of doubling the storage size of such columns. +To keep the old format set the system-wide property `druid.indexing.doubleStorage=float`. +You can also use `floatSum`, `floatMin`, and `floatMax` to use 32-bit float representation. +Support for 64-bit floating point columns was released in Druid 0.11.0, so if you use this feature then older versions of Druid will not be able to read your data segments. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexing.doubleStorage`|Set to "float" to use 32-bit double representation for double columns.|double| + +### HTTP client + +All Druid components can communicate with each other over HTTP. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.global.http.numConnections`|Size of connection pool per destination URL. If there are more HTTP requests than this number that all need to speak to the same URL, then they will queue up.|`20`| +|`druid.global.http.eagerInitialization`|Indicates that http connections should be eagerly initialized. If set to true, `numConnections` connections are created upon initialization|`false`| +|`druid.global.http.compressionCodec`|Compression codec to communicate with others. May be "gzip" or "identity".|`gzip`| +|`druid.global.http.readTimeout`|The timeout for data reads.|`PT15M`| +|`druid.global.http.unusedConnectionTimeout`|The timeout for idle connections in connection pool. The connection in the pool will be closed after this timeout and a new one will be established. This timeout should be less than `druid.global.http.readTimeout`. 
Set this timeout = ~90% of `druid.global.http.readTimeout`|`PT4M`| +|`druid.global.http.numMaxThreads`|Maximum number of I/O worker threads|`(number of cores) * 3 / 2 + 1`| +|`druid.global.http.clientConnectTimeout`|The timeout (in milliseconds) for establishing client connections.|500| + +### Common endpoints configuration + +This section contains the configuration options for endpoints that are supported by all services. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.server.hiddenProperties`| If property names or substring of property names (case insensitive) is in this list, responses of the `/status/properties` endpoint do not show these properties | `["druid.s3.accessKey","druid.s3.secretKey","druid.metadata.storage.connector.password", "password", "key", "token", "pwd"]` | + +## Master server + +This section contains the configuration options for the services that reside on Master servers (Coordinators and Overlords) in the suggested [three-server configuration](../design/architecture.md#druid-servers). + +### Coordinator + +For general Coordinator services information, see [Coordinator service](../design/coordinator.md). + +#### Static Configuration + +These Coordinator static configurations can be defined in the `coordinator/runtime.properties` file. + +##### Coordinator service config + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.host`|The host for the current service. This is used to advertise the current service location as reachable from another service and should generally be specified such that `http://${druid.host}/` could actually talk to this service.|`InetAddress.getLocalHost().getCanonicalHostName()`| +|`druid.bindOnHost`|Indicating whether the service's internal jetty server bind on `druid.host`. Default is false, which means binding to all interfaces.|false| +|`druid.plaintextPort`|This is the port to actually listen on; unless port mapping is used, this will be the same port as is on `druid.host`|8081| +|`druid.tlsPort`|TLS port for HTTPS connector, if [druid.enableTlsPort](../operations/tls-support.md) is set then this config will be used. If `druid.host` contains port then that port will be ignored. This should be a non-negative integer.|8281| +|`druid.service`|The name of the service. This is used as a dimension when emitting metrics and alerts to differentiate between the various services.|`druid/coordinator`| +|`druid.labels`|Optional JSON object of key-value pairs that define custom labels for the server. These labels are displayed in the web console under the "Services" tab. Example: `druid.labels={"location":"Airtrunk"}` or `druid.labels.location=Airtrunk`|`null`| + +##### Coordinator operation + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.coordinator.period`|The run period for the Coordinator. The Coordinator operates by maintaining the current state of the world in memory and periodically looking at the set of "used" segments and segments being served to make decisions about whether any changes need to be made to the data topology. This property sets the delay between each of these runs.|`PT60S`| +|`druid.coordinator.startDelay`|The operation of the Coordinator works on the assumption that it has an up-to-date view of the state of the world when it runs, the current ZooKeeper interaction code, however, is written in a way that doesn’t allow the Coordinator to know for a fact that it’s done loading the current state of the world. 
This delay is a hack to give it enough time to believe that it has all the data.|`PT300S`| +|`druid.coordinator.load.timeout`|The timeout duration for when the Coordinator assigns a segment to a Historical service.|`PT15M`| +|`druid.coordinator.balancer.strategy`|The [balancing strategy](../design/coordinator.md#balancing-segments-in-a-tier) used by the Coordinator to distribute segments among the Historical servers in a tier. The `cost` strategy distributes segments by minimizing a cost function, `diskNormalized` weights these costs with the disk usage ratios of the servers and `random` distributes segments randomly.|`cost`| +|`druid.coordinator.loadqueuepeon.http.repeatDelay`|The start and repeat delay (in milliseconds) for the load queue peon, which manages the load/drop queue of segments for any server.|1 minute| +|`druid.coordinator.loadqueuepeon.http.batchSize`|Number of segment load/drop requests to batch in one HTTP request. Note that it must be smaller than or equal to the `druid.segmentCache.numLoadingThreads` config on Historical service. If this value is not configured, the coordinator uses the value of the `numLoadingThreads` for the respective server. | `druid.segmentCache.numLoadingThreads` | +|`druid.coordinator.asOverlord.enabled`|Boolean value for whether this Coordinator service should act like an Overlord as well. This configuration allows users to simplify a Druid cluster by not having to deploy any standalone Overlord services. If set to true, then Overlord console is available at `http://coordinator-host:port/console.html` and be sure to set `druid.coordinator.asOverlord.overlordService` also.|false| +|`druid.coordinator.asOverlord.overlordService`| Required, if `druid.coordinator.asOverlord.enabled` is `true`. This must be same value as `druid.service` on standalone Overlord services and `druid.selectors.indexing.serviceName` on Middle Managers.|NULL| + +##### Data management + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.coordinator.period.indexingPeriod`|Period to run data management duties on the Coordinator including launching compact tasks and performing clean up of unused data. It is recommended to keep this value longer than `druid.manager.segments.pollDuration`.|`PT1800S` (30 mins)| +|`druid.coordinator.kill.pendingSegments.on`|Boolean flag for whether or not the Coordinator clean up old entries in the `pendingSegments` table of metadata store. If set to true, Coordinator will check the created time of most recently complete task. If it doesn't exist, it finds the created time of the earliest running/pending/waiting tasks. Once the created time is found, then for all datasources not in the `killPendingSegmentsSkipList` (see [Dynamic configuration](#dynamic-configuration)), Coordinator will ask the Overlord to clean up the entries 1 day or more older than the found created time in the `pendingSegments` table. This will be done periodically based on `druid.coordinator.period.indexingPeriod` specified.|true| +|`druid.coordinator.kill.on`|Boolean flag to enable the Coordinator to submit a kill task for unused segments and delete them permanently from the metadata store and deep storage.|false| +|`druid.coordinator.kill.period`| The frequency of sending kill tasks to the indexing service. The value must be greater than or equal to `druid.coordinator.period.indexingPeriod`. 
Only applies if kill is turned on.|Same as `druid.coordinator.period.indexingPeriod`| +|`druid.coordinator.kill.durationToRetain`|Duration, in ISO 8601 format, relative to the current time that identifies the data interval of segments to retain. When `druid.coordinator.kill.on` is true, any segment with a data interval ending before `now - durationToRetain` is eligible for permanent deletion. For example, if `durationToRetain` is set to `P90D`, unused segments with time intervals ending 90 days in the past are eligible for deletion. If `durationToRetain` is set to a negative ISO 8601 period, segments with future intervals ending before `now - durationToRetain` are also eligible for deletion.|`P90D`| +|`druid.coordinator.kill.ignoreDurationToRetain`|A way to override `druid.coordinator.kill.durationToRetain` and tell the coordinator that you do not care about the end date of unused segment intervals when it comes to killing them. If true, the coordinator considers all unused segments as eligible to be killed.|false| +|`druid.coordinator.kill.bufferPeriod`|The amount of time that a segment must be unused before it is able to be permanently removed from metadata and deep storage. This can serve as a buffer period to prevent data loss if data ends up being needed after being marked unused.|`P30D`| +|`druid.coordinator.kill.maxSegments`|The number of unused segments to kill per kill task. This number must be greater than 0. This only applies when `druid.coordinator.kill.on=true`.|100| +|`druid.coordinator.kill.maxInterval`|The largest interval, as an [ISO 8601 duration](https://en.wikipedia.org/wiki/ISO_8601#Durations), of segments to delete per kill task. Set to zero, e.g. `PT0S`, for unlimited. This only applies when `druid.coordinator.kill.on=true`.|`P30D`| + +##### Metadata management + +|Property|Description|Required|Default| +|--------|-----------|---------|-------| +|`druid.coordinator.period.metadataStoreManagementPeriod`|How often to run metadata management tasks in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. |No | `PT1H`| +|`druid.coordinator.kill.supervisor.on`| Boolean value for whether to enable automatic deletion of terminated supervisors. If set to true, Coordinator will periodically remove terminated supervisors from the supervisor table in metadata storage.| No |true| +|`druid.coordinator.kill.supervisor.period`| How often to do automatic deletion of terminated supervisor in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Value must be equal to or greater than `druid.coordinator.period.metadataStoreManagementPeriod`. Only applies if `druid.coordinator.kill.supervisor.on` is set to true.| No| `P1D`| +|`druid.coordinator.kill.supervisor.durationToRetain`| Duration of terminated supervisor to be retained from created time in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Only applies if `druid.coordinator.kill.supervisor.on` is set to true.| Yes if `druid.coordinator.kill.supervisor.on` is set to true.| `P90D`| +|`druid.coordinator.kill.audit.on`| Boolean value for whether to enable automatic deletion of audit logs. If set to true, Coordinator will periodically remove audit logs from the audit table entries in metadata storage.| No | True| +|`druid.coordinator.kill.audit.period`| How often to do automatic deletion of audit logs in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Value must be equal to or greater than `druid.coordinator.period.metadataStoreManagementPeriod`. 
Only applies if `druid.coordinator.kill.audit.on` is set to true.| No| `P1D`| +|`druid.coordinator.kill.audit.durationToRetain`| Duration of audit logs to be retained from created time in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Only applies if `druid.coordinator.kill.audit.on` is set to true.| Yes if `druid.coordinator.kill.audit.on` is set to true.| `P90D`| +|`druid.coordinator.kill.compaction.on`| Boolean value for whether to enable automatic deletion of compaction configurations. If set to true, Coordinator will periodically remove compaction configuration of inactive datasource (datasource with no used and unused segments) from the config table in metadata storage. | No |True| +|`druid.coordinator.kill.compaction.period`| How often to do automatic deletion of compaction configurations in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Value must be equal to or greater than `druid.coordinator.period.metadataStoreManagementPeriod`. Only applies if `druid.coordinator.kill.compaction.on` is set to true.| No| `P1D`| +|`druid.coordinator.kill.rule.on`| Boolean value for whether to enable automatic deletion of rules. If set to true, Coordinator will periodically remove rules of inactive datasource (datasource with no used and unused segments) from the rule table in metadata storage.| No | True| +|`druid.coordinator.kill.rule.period`| How often to do automatic deletion of rules in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Value must be equal to or greater than `druid.coordinator.period.metadataStoreManagementPeriod`. Only applies if `druid.coordinator.kill.rule.on` is set to true.| No| `P1D`| +|`druid.coordinator.kill.rule.durationToRetain`| Duration of rules to be retained from created time in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Only applies if `druid.coordinator.kill.rule.on` is set to true.| Yes if `druid.coordinator.kill.rule.on` is set to true.| `P90D`| +|`druid.coordinator.kill.datasource.on`| Boolean value for whether to enable automatic deletion of datasource metadata (Note: datasource metadata only exists for datasource created from supervisor). If set to true, Coordinator will periodically remove datasource metadata of terminated supervisor from the datasource table in metadata storage. | No | True| +|`druid.coordinator.kill.datasource.period`| How often to do automatic deletion of datasource metadata in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Value must be equal to or greater than `druid.coordinator.period.metadataStoreManagementPeriod`. Only applies if `druid.coordinator.kill.datasource.on` is set to true.| No| `P1D`| +|`druid.coordinator.kill.datasource.durationToRetain`| Duration of datasource metadata to be retained from created time in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Only applies if `druid.coordinator.kill.datasource.on` is set to true.| Yes if `druid.coordinator.kill.datasource.on` is set to true.| `P90D`| +|`druid.coordinator.kill.segmentSchema.on`| Boolean value for whether to enable automatic deletion of unused segment schemas. If set to true, Coordinator will periodically identify segment schemas which are not referenced by any used segment and mark them as unused. At a later point, these unused schemas are deleted. Only applies if [Centralized Datasource schema](#centralized-datasource-schema-experimental) feature is enabled. 
| No | True| +|`druid.coordinator.kill.segmentSchema.period`| How often to do automatic deletion of segment schemas in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Value must be equal to or greater than `druid.coordinator.period.metadataStoreManagementPeriod`. Only applies if `druid.coordinator.kill.segmentSchema.on` is set to true.| No| `P1D`| +|`druid.coordinator.kill.segmentSchema.durationToRetain`| Duration of segment schemas to be retained from the time it was marked as unused in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Only applies if `druid.coordinator.kill.segmentSchema.on` is set to true.| Yes, if `druid.coordinator.kill.segmentSchema.on` is set to true.| `P90D`| + +##### Segment management + +|Property|Possible values|Description|Default| +|--------|---------------|-----------|-------| +|`druid.serverview.type`|batch or http|Segment discovery method to use. "http" enables discovering segments using HTTP instead of ZooKeeper.|http| +|`druid.coordinator.segment.awaitInitializationOnStart`|true or false|Whether the Coordinator will wait for its view of segments to fully initialize before starting up. If set to 'true', the Coordinator's HTTP server will not start up, and the Coordinator will not announce itself as available, until the server view is initialized.|true| + +##### Metadata retrieval + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.manager.config.pollDuration`|How often the manager polls the config table for updates.|`PT1M`| +|`druid.manager.segments.pollDuration`|The duration between polls the Coordinator does for updates to the set of active segments. Generally defines the amount of lag time it can take for the Coordinator to notice new segments.|`PT1M`| +|`druid.manager.segments.useIncrementalCache`|(Experimental) Denotes the usage mode of the segment metadata incremental cache. This cache provides a performance improvement over the polling mechanism currently employed by the Coordinator as it retrieves payloads of only updated segments. Possible cache modes are: (a) `never`: Incremental cache is disabled. (b) `always`: Incremental cache is enabled. Service start-up will be blocked until cache has synced with the metadata store at least once. (c) `ifSynced`: Cache is enabled. This mode does not block service start-up and is a way to retain existing behavior of the Coordinator. If the incremental cache is in modes `always` or `ifSynced`, reads from the cache will block until it has synced with the metadata store at least once after becoming leader. The Coordinator never writes to this cache.|`never`| +|`druid.manager.rules.pollDuration`|The duration between polls the Coordinator does for updates to the set of active rules. Generally defines the amount of lag time it can take for the Coordinator to notice rules.|`PT1M`| +|`druid.manager.rules.defaultRule`|The default rule for the cluster|`_default`| +|`druid.manager.rules.alertThreshold`|The duration after a failed poll upon which an alert should be emitted.|`PT10M`| + +#### Dynamic configuration + +The Coordinator has dynamic configurations to tune certain behavior on the fly, without requiring a service restart. +You can configure these parameters using the [web console](../operations/web-console.md)(recommended) or through the [Coordinator dynamic configuration API](../api-reference/dynamic-configuration-api.md#coordinator-dynamic-configuration). + +The following table shows the dynamic configuration properties for the Coordinator. 
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`millisToWaitBeforeDeleting`|How long the Coordinator needs to be the leader before it can start marking overshadowed segments as unused in metadata storage.| 900000 (15 mins)|
+|`smartSegmentLoading`|Enables ["smart" segment loading mode](#smart-segment-loading) which dynamically computes the optimal values of several properties that maximize Coordinator performance.|true|
+|`maxSegmentsToMove`|The maximum number of segments that can be moved in a Historical tier at any given time.|100|
+|`replicantLifetime`|The maximum number of Coordinator runs for which a segment can wait in the load queue of a Historical before Druid raises an alert.|15|
+|`replicationThrottleLimit`|The maximum number of segment replicas that can be assigned to a Historical tier in a single Coordinator run. This property prevents Historical services from becoming overwhelmed when loading extra replicas of segments that are already available in the cluster.|500|
+|`balancerComputeThreads`|Thread pool size for computing the moving cost of segments during segment balancing. Consider increasing this if you have a lot of segments and moving segments begins to stall.|`num_cores` / 2|
+|`killDataSourceWhitelist`|List of specific data sources for which kill tasks can be issued if `druid.coordinator.kill.on` is true. It can be a comma-separated list of data source names or a JSON array. If `killDataSourceWhitelist` is empty, the Coordinator issues kill tasks for all data sources.|none|
+|`killTaskSlotRatio`|Ratio of total available task slots, including autoscaling if applicable, that can be used by kill tasks. This value must be between 0 and 1. Only applies to kill tasks that are spawned automatically by the Coordinator's auto-kill duty, which is enabled when `druid.coordinator.kill.on` is true.|0.1|
+|`maxKillTaskSlots`|Maximum number of task slots that can be used by kill tasks. This limit only applies to kill tasks that are spawned automatically by the Coordinator's auto-kill duty, which is enabled when `druid.coordinator.kill.on` is true.|`Integer.MAX_VALUE` - no limit|
+|`killPendingSegmentsSkipList`|List of data sources for which pendingSegments are _NOT_ cleaned up if property `druid.coordinator.kill.pendingSegments.on` is true. This can be a list of comma-separated data sources or a JSON array.|none|
+|`maxSegmentsInNodeLoadingQueue`|The maximum number of segments allowed in the load queue of any given server. Use this parameter to load segments faster if, for example, the cluster contains slow-loading nodes or if there are too many segments to be replicated to a particular node (when faster loading is preferred to better segment distribution). The optimal value depends on the loading speed of segments, acceptable replication time, and the number of nodes.|500|
+|`useRoundRobinSegmentAssignment`|Boolean flag for whether segments should be assigned to Historical services in a round robin fashion. When disabled, segment assignment is done using the chosen balancer strategy. When enabled, this can speed up segment assignments, leaving balancing to lazily move the segments to their optimal locations (based on the balancer strategy).|true|
+|`decommissioningNodes`|List of Historical servers to decommission. 
Coordinator will not assign new segments to decommissioning servers, and segments will be moved away from them to be placed on non-decommissioning servers at the maximum rate specified by `maxSegmentsToMove`.|none| +|`pauseCoordination`|Boolean flag for whether or not the Coordinator should execute its various duties of coordinating the cluster. Setting this to true essentially pauses all coordination work while allowing the API to remain up. Duties that are paused include all classes that implement the `CoordinatorDuty` interface. Such duties include: segment balancing, segment compaction, submitting kill tasks for unused segments (if enabled), logging of used segments in the cluster, marking of newly unused or overshadowed segments, matching and execution of load/drop rules for used segments, unloading segments that are no longer marked as used from Historical servers. An example of when an admin may want to pause coordination would be if they are doing deep storage maintenance on HDFS name nodes with downtime and don't want the Coordinator to be directing Historical nodes to hit the name node with API requests until maintenance is done and the deep store is declared healthy for use again.|false| +|`replicateAfterLoadTimeout`|Boolean flag for whether or not additional replication is needed for segments that have failed to load due to the expiry of `druid.coordinator.load.timeout`. If this is set to true, the Coordinator will attempt to replicate the failed segment on a different historical server. This helps improve the segment availability if there are a few slow Historicals in the cluster. However, the slow Historical may still load the segment later and the Coordinator may issue drop requests if the segment is over-replicated.|false| +|`turboLoadingNodes`| Experimental. List of Historical servers to place in turbo loading mode. These servers use a larger thread-pool to load segments faster but at the cost of query performance. For servers specified in `turboLoadingNodes`, `druid.coordinator.loadqueuepeon.http.batchSize` is ignored and the coordinator uses the value of the respective `numLoadingThreads` instead.
Please use this config with caution. All servers should eventually be removed from this list once the segment loading on the respective historicals is finished. |none| +|`cloneServers`| Experimental. Map from target Historical server to source Historical server which should be cloned by the target. The target Historical does not participate in regular segment assignment or balancing. Instead, the Coordinator mirrors any segment assignment made to the source Historical onto the target Historical, so that the target becomes an exact copy of the source. Segments on the target Historical do not count towards replica counts either. If the source disappears, the target remains in the last known state of the source server until removed from the configuration.
Use this config with caution. All servers should eventually be removed from this list once the desired state on the respective Historicals is achieved. |none|
+
+##### Smart segment loading
+
+The `smartSegmentLoading` mode simplifies Coordinator configuration for segment loading and balancing.
+If you enable this mode, do not provide values for the properties in the table below, as the Coordinator computes them automatically.
+Druid computes the values to optimize Coordinator performance, based on the current state of the cluster.
+
+If you enable `smartSegmentLoading` mode, Druid ignores any value you provide for the following properties.
+
+|Property|Computed value|Description|
+|--------|--------------|-----------|
+|`useRoundRobinSegmentAssignment`|true|Speeds up segment assignment.|
+|`maxSegmentsInNodeLoadingQueue`|0|Removes the limit on load queue size.|
+|`replicationThrottleLimit`|5% of used segments, minimum value 100|Prevents aggressive replication when a Historical disappears only intermittently.|
+|`replicantLifetime`|60|Allows segments to wait about an hour (assuming a Coordinator period of 1 minute) in the load queue before an alert is raised. In `smartSegmentLoading` mode, load queues are not limited by size. Segments might therefore be assigned to a load queue even if the corresponding server is slow to load them.|
+|`maxSegmentsToMove`|2% of used segments, minimum value 100, maximum value 1000|Ensures that some segments are always moving in the cluster to keep it well balanced. The maximum value keeps the Coordinator run times bounded.|
+|`balancerComputeThreads`|`num_cores` / 2|Ensures that there are enough threads to perform balancing computations without hogging all Coordinator resources.|
+
+When `smartSegmentLoading` is disabled, Druid uses the configured values of these properties.
+Disable `smartSegmentLoading` only if you want to explicitly set the values of any of the above properties.
+
+##### Lookups dynamic configuration
+
+These configuration options control Coordinator lookup management. For configurations that affect lookup propagation, see [Dynamic configuration for lookups](../querying/lookups.md#dynamic-configuration).
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.manager.lookups.hostDeleteTimeout`|How long to wait for a `DELETE` request to a particular service before considering the `DELETE` a failure.|`PT1S`|
+|`druid.manager.lookups.hostUpdateTimeout`|How long to wait for a `POST` request to a particular service before considering the `POST` a failure.|`PT10S`|
+|`druid.manager.lookups.deleteAllTimeout`|How long to wait for all `DELETE` requests to finish before considering the delete attempt a failure.|`PT10S`|
+|`druid.manager.lookups.updateAllTimeout`|How long to wait for all `POST` requests to finish before considering the attempt a failure.|`PT60S`|
+|`druid.manager.lookups.threadPoolSize`|How many services can be managed concurrently (concurrent `POST` and `DELETE` requests). Requests beyond this limit wait in a queue until a slot becomes available.|10|
+|`druid.manager.lookups.period`|Number of milliseconds between checks for configuration changes.|120000 (2 minutes)|
+
+##### Automatic compaction dynamic configuration
+
+You can set or update [automatic compaction](../data-management/automatic-compaction.md) properties dynamically using the
+[Automatic compaction API](../api-reference/automatic-compaction-api.md) without restarting Coordinators. 
+ +For details about segment compaction, see [Segment size optimization](../operations/segment-optimization.md). + +You can configure automatic compaction through the following properties: + +|Property|Description|Required| +|--------|-----------|--------| +|`dataSource`|The datasource name to be compacted.|yes| +|`taskPriority`|[Priority](../ingestion/tasks.md#lock-priority) of compaction task.|no (default = 25)| +|`inputSegmentSizeBytes`|Maximum number of total segment bytes processed per compaction task. Since a time chunk must be processed in its entirety, if the segments for a particular time chunk have a total size in bytes greater than this parameter, compaction will not run for that time chunk.|no (default = 100,000,000,000,000 i.e. 100TB)| +|`skipOffsetFromLatest`|The offset for searching segments to be compacted in [ISO 8601](https://en.wikipedia.org/wiki/ISO_8601) duration format. Strongly recommended to set for realtime datasources. See [Data handling with compaction](../data-management/compaction.md#data-handling-with-compaction).|no (default = "P1D")| +|`tuningConfig`|Tuning config for compaction tasks. See below [Automatic compaction tuningConfig](#automatic-compaction-tuningconfig).|no| +|`taskContext`|[Task context](../ingestion/tasks.md#context-parameters) for compaction tasks.|no| +|`granularitySpec`|Custom `granularitySpec`. See [Automatic compaction granularitySpec](#automatic-compaction-granularityspec).|no| +|`dimensionsSpec`|Custom `dimensionsSpec`. See [Automatic compaction dimensionsSpec](#automatic-compaction-dimensionsspec).|no| +|`transformSpec`|Custom `transformSpec`. See [Automatic compaction transformSpec](#automatic-compaction-transformspec).|no| +|`metricsSpec`|Custom [`metricsSpec`](../ingestion/ingestion-spec.md#metricsspec). The compaction task preserves any existing metrics regardless of whether `metricsSpec` is specified. If `metricsSpec` is specified, Druid does not reapply any aggregators matching the metric names specified in `metricsSpec` to rows that already have the associated metrics. For rows that do not already have the metric specified in `metricsSpec`, Druid applies the metric aggregator on the source column, then proceeds to combine the metrics across segments as usual. If `metricsSpec` is not specified, Druid automatically discovers the metrics in the existing segments and combines existing metrics with the same metric name across segments. Aggregators for metrics with the same name are assumed to be compatible for combining across segments, otherwise the compaction task may fail.|no| +|`ioConfig`|IO config for compaction tasks. See [Automatic compaction ioConfig](#automatic-compaction-ioconfig).|no| + +Automatic compaction config example: + +```json +{ + "dataSource": "wikiticker", + "granularitySpec" : { + "segmentGranularity" : "none" + } +} +``` + +Compaction tasks fail when higher priority tasks cause Druid to revoke their locks. By default, realtime tasks like ingestion have a higher priority than compaction tasks. Frequent conflicts between compaction tasks and realtime tasks can cause the Coordinator's automatic compaction to hang. +You may see this issue with streaming ingestion from Kafka and Kinesis, which ingest late-arriving data. + +To mitigate this problem, set `skipOffsetFromLatest` to a value large enough so that arriving data tends to fall outside the offset value from the current time. This way you can avoid conflicts between compaction tasks and realtime ingestion tasks. 
+For example, if you want to skip over segments from thirty days prior to the end time of the most recent segment, assign `"skipOffsetFromLatest": "P30D"`. +For more information, see [Avoid conflicts with ingestion](../data-management/automatic-compaction.md#avoid-conflicts-with-ingestion). + +###### Automatic compaction tuningConfig + +Auto-compaction supports a subset of the [tuningConfig for Parallel task](../ingestion/native-batch.md#tuningconfig). + +The following table shows the supported configurations for auto-compaction. + +|Property|Description|Required| +|--------|-----------|--------| +|type|The task type. If you're using Coordinator duties for auto-compaction, set it to `index_parallel`. If you're using compaction supervisors, set it to `autocompact`. |yes| +|`maxRowsInMemory`|Used in determining when intermediate persists to disk should occur. Normally user does not need to set this, but depending on the nature of data, if rows are short in terms of bytes, user may not want to store a million rows in memory and this value should be set.|no (default = 1000000)| +|`maxBytesInMemory`|Used in determining when intermediate persists to disk should occur. Normally this is computed internally and user does not need to set it. This value represents number of bytes to aggregate in heap memory before persisting. This is based on a rough estimate of memory usage and not actual usage. The maximum heap memory usage for indexing is `maxBytesInMemory` * (2 + `maxPendingPersists`)|no (default = 1/6 of max JVM memory)| +|`splitHintSpec`|Used to give a hint to control the amount of data that each first phase task reads. This hint could be ignored depending on the implementation of the input source. See [Split hint spec](../ingestion/native-batch.md#split-hint-spec) for more details.|no (default = size-based split hint spec)| +|`partitionsSpec`|Defines how to partition data in each time chunk, see [`PartitionsSpec`](../ingestion/native-batch.md#partitionsspec)|no (default = `dynamic`)| +|`indexSpec`|Defines segment storage format options to be used at indexing time, see [IndexSpec](../ingestion/ingestion-spec.md#indexspec)|no| +|`indexSpecForIntermediatePersists`|Defines segment storage format options to be used at indexing time for intermediate persisted temporary segments. this can be used to disable dimension/metric compression on intermediate segments to reduce memory required for final merging. however, disabling compression on intermediate segments might increase page cache use while they are used before getting merged into final segment published, see [IndexSpec](../ingestion/ingestion-spec.md#indexspec) for possible values.|no| +|`maxPendingPersists`|Maximum number of persists that can be pending but not started. If this limit would be exceeded by a new intermediate persist, ingestion will block until the currently-running persist finishes. Maximum heap memory usage for indexing scales with `maxRowsInMemory` * (2 + `maxPendingPersists`).|no (default = 0, meaning one persist can be running concurrently with ingestion, and none can be queued up)| +|`pushTimeout`|Milliseconds to wait for pushing segments. It must be >= 0, where 0 means to wait forever.|no (default = 0)| +|`segmentWriteOutMediumFactory`|Segment write-out medium to use when creating segments. 
See [SegmentWriteOutMediumFactory](../ingestion/native-batch.md#segmentwriteoutmediumfactory).|no (default is the value of `druid.peon.defaultSegmentWriteOutMediumFactory.type`)|
+|`maxNumConcurrentSubTasks`|Maximum number of worker tasks that can run in parallel at the same time. The supervisor task spawns worker tasks up to `maxNumConcurrentSubTasks`, regardless of the currently available task slots. If this value is set to 1, the supervisor task processes data ingestion on its own instead of spawning worker tasks. If this value is set too large, too many worker tasks may be created, which can block other ingestion. Check [Capacity Planning](../ingestion/native-batch.md#capacity-planning) for more details.|no (default = 1)|
+|`maxRetry`|Maximum number of retries on task failures.|no (default = 3)|
+|`maxNumSegmentsToMerge`|Max limit for the number of segments that a single task can merge at the same time in the second phase. Used only with `hashed` or `single_dim` partitionsSpec.|no (default = 100)|
+|`totalNumMergeTasks`|Total number of tasks to merge segments in the merge phase when `partitionsSpec` is set to `hashed` or `single_dim`.|no (default = 10)|
+|`taskStatusCheckPeriodMs`|Polling period in milliseconds to check running task statuses.|no (default = 1000)|
+|`chatHandlerTimeout`|Timeout for reporting the pushed segments in worker tasks.|no (default = PT10S)|
+|`chatHandlerNumRetries`|Retries for reporting the pushed segments in worker tasks.|no (default = 5)|
+|`engine` | Engine for compaction. Can be either `native` or `msq`. `msq` uses the MSQ task engine and is only supported with [compaction supervisors](../data-management/automatic-compaction.md#auto-compaction-using-compaction-supervisors). | no (default = native)|
+
+###### Automatic compaction granularitySpec
+
+|Field|Description|Required|
+|-----|-----------|--------|
+|`segmentGranularity`|Time chunking period for the segment granularity. Defaults to 'null', which preserves the original segment granularity. Accepts all [Query granularity](../querying/granularities.md) values.|No|
+|`queryGranularity`|The resolution of timestamp storage within each segment. Defaults to 'null', which preserves the original query granularity. Accepts all [Query granularity](../querying/granularities.md) values.|No|
+|`rollup`|Whether to enable ingestion-time rollup or not. Defaults to null, which preserves the original setting. Note that once data is rolled up, individual records can no longer be recovered. |No|
+
+###### Automatic compaction dimensionsSpec
+
+|Field|Description|Required|
+|-----|-----------|--------|
+|`dimensions`| A list of dimension names or objects. Defaults to null, which preserves the original dimensions. Note that setting this will cause segments manually compacted with `dimensionExclusions` to be compacted again.|No|
+
+###### Automatic compaction transformSpec
+
+|Field|Description|Required|
+|-----|-----------|--------|
+|`filter`| Conditionally filters input rows during compaction. Only rows that pass the filter are included in the compacted segments. Any of Druid's standard [query filters](../querying/filters.md) can be used. Defaults to null, which does not filter any rows. |No|
+
+###### Automatic compaction ioConfig
+
+Auto-compaction supports a subset of the [ioConfig for Parallel task](../ingestion/native-batch.md).
+The following is a list of the supported configurations for auto-compaction. 
+ +|Property|Description|Default|Required| +|--------|-----------|-------|--------| +|`dropExisting`|If `true` the compaction task replaces all existing segments fully contained by the umbrella interval of the compacted segments when the task publishes new segments and tombstones. If compaction fails, Druid does not publish any segments or tombstones. WARNING: this functionality is still in beta. Note that changing this config does not cause intervals to be compacted again.|false|no| + +### Overlord + +For general Overlord service information, see [Overlord](../design/overlord.md). + +#### Overlord static configuration + +These Overlord static configurations can be defined in the `overlord/runtime.properties` file. + +##### Overlord service configs + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.host`|The host for the current service. This is used to advertise the current service location as reachable from another service and should generally be specified such that `http://${druid.host}/` could actually talk to this service.|`InetAddress.getLocalHost().getCanonicalHostName()`| +|`druid.bindOnHost`|Indicating whether the service's internal jetty server bind on `druid.host`. Default is false, which means binding to all interfaces.|false| +|`druid.plaintextPort`|This is the port to actually listen on; unless port mapping is used, this will be the same port as is on `druid.host`.|8090| +|`druid.tlsPort`|TLS port for HTTPS connector, if [druid.enableTlsPort](../operations/tls-support.md) is set then this config will be used. If `druid.host` contains port then that port will be ignored. This should be a non-negative Integer.|8290| +|`druid.service`|The name of the service. This is used as a dimension when emitting metrics and alerts to differentiate between the various services.|`druid/overlord`| +|`druid.labels`|Optional JSON object of key-value pairs that define custom labels for the server. These labels are displayed in the web console under the "Services" tab. Example: `druid.labels={"location":"Airtrunk"}` or `druid.labels.location=Airtrunk`|`null`| + +##### Overlord operations + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexer.runner.type`|Indicates whether tasks should be run locally using `local` or in a distributed environment using `remote`. The recommended option is `httpRemote`, which is similar to `remote` but uses HTTP to interact with Middle Managers instead of ZooKeeper.|`httpRemote`| +|`druid.indexer.storage.type`|Indicates whether incoming tasks should be stored locally (in heap) or in metadata storage. One of `local` or `metadata`. `local` is mainly for internal testing while `metadata` is recommended in production because storing incoming tasks in metadata storage allows for tasks to be resumed if the Overlord should fail.|`local`| +|`druid.indexer.storage.recentlyFinishedThreshold`|Duration of time to store task results. Default is 24 hours. If you have hundreds of tasks running in a day, consider increasing this threshold.|`PT24H`| +|`druid.indexer.tasklock.forceTimeChunkLock`|**Setting this to false is still experimental**
If set to true, all tasks are forced to use time chunk locks. If set to false, each task automatically chooses a lock type to use. This configuration can be overridden by setting `forceTimeChunkLock` in the [task context](../ingestion/tasks.md#context-parameters). See [Task lock system](../ingestion/tasks.md#task-lock-system) for more details about locking in tasks.|true|
+|`druid.indexer.tasklock.batchSegmentAllocation`| If set to true, Druid performs segment allocate actions in batches to improve throughput and reduce the average `task/action/run/time`. See [batching `segmentAllocate` actions](../ingestion/tasks.md#batching-segmentallocate-actions) for details.|true|
+|`druid.indexer.tasklock.batchAllocationWaitTime`|Number of milliseconds after Druid adds the first segment allocate action to a batch, until it executes the batch. Allows the batch to add more requests and improve the average segment allocation run time. This configuration takes effect only if `batchSegmentAllocation` is enabled.|0|
+|`druid.indexer.tasklock.batchAllocationNumThreads`|Number of worker threads to use for batch segment allocation. This represents the maximum number of allocation batches that can be processed in parallel for distinct datasources. Batches for a single datasource are always processed sequentially. This configuration takes effect only if `batchSegmentAllocation` is enabled.|5|
+|`druid.indexer.task.default.context`|Default task context that is applied to all tasks submitted to the Overlord. Any default in this config overrides neither the context values the user provides nor `druid.indexer.tasklock.forceTimeChunkLock`.|empty context|
+|`druid.indexer.queue.maxSize`|Maximum number of active tasks at one time.|`Integer.MAX_VALUE`|
+|`druid.indexer.queue.startDelay`|Sleep this long before starting Overlord queue management. This can be useful to give a cluster time to re-orient itself (for example, after a widespread network issue).|`PT1M`|
+|`druid.indexer.queue.restartDelay`|Sleep this long when Overlord queue management throws an exception before trying again.|`PT30S`|
+|`druid.indexer.queue.storageSyncRate`|Sync Overlord state this often with an underlying task persistence mechanism.|`PT1M`|
+|`druid.indexer.queue.maxTaskPayloadSize`|Maximum allowed size in bytes of a single task payload accepted by the Overlord.|none (allow all task payload sizes)|
+
+The following configs only apply if the Overlord is running in remote mode. For a description of local vs. remote mode, see [Overlord service](../design/overlord.md).
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.indexer.runner.taskAssignmentTimeout`|How long to wait after a task has been assigned to a Middle Manager before throwing an error.|`PT5M`|
+|`druid.indexer.runner.minWorkerVersion`|The minimum Middle Manager version to send tasks to. The version number is a string. This affects the expected behavior during certain operations like comparison against `druid.worker.version`. Specifically, the version comparison follows dictionary order. Use ISO8601 date format for the version to accommodate date comparisons. |"0"|
+| `druid.indexer.runner.parallelIndexTaskSlotRatio`| The ratio of task slots available for parallel indexing supervisor tasks per worker. The specified value must be in the range `[0, 1]`. 
|1|
+|`druid.indexer.runner.compressZnodes`|Indicates whether or not the Overlord should expect Middle Managers to compress Znodes.|true|
+|`druid.indexer.runner.maxZnodeBytes`|The maximum Znode size in bytes that can be created in ZooKeeper. Must be in the range `[10KiB, 2GiB)`. [Human-readable format](human-readable-byte.md) is supported.| 512 KiB |
+|`druid.indexer.runner.taskCleanupTimeout`|How long to wait before failing a task after a Middle Manager is disconnected from ZooKeeper.|`PT15M`|
+|`druid.indexer.runner.taskShutdownLinkTimeout`|How long to wait on a shutdown request to a Middle Manager before timing out.|`PT1M`|
+|`druid.indexer.runner.pendingTasksRunnerNumThreads`|Number of threads used to allocate pending tasks to workers. Must be at least 1.|1|
+|`druid.indexer.runner.maxRetriesBeforeBlacklist`|Number of consecutive times a Middle Manager can fail tasks before the worker is blacklisted. Must be at least 1.|5|
+|`druid.indexer.runner.workerBlackListBackoffTime`|How long to wait before a blacklisted worker is whitelisted again. This value should be greater than the value set for `druid.indexer.runner.workerBlackListCleanupPeriod`.|`PT15M`|
+|`druid.indexer.runner.workerBlackListCleanupPeriod`|A duration after which the cleanup thread will start up to clean blacklisted workers.|`PT5M`|
+|`druid.indexer.runner.maxPercentageBlacklistWorkers`|The maximum percentage of workers to blacklist. This must be between 0 and 100.|20|
+
+If autoscaling is enabled, you can set these additional configs:
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.indexer.autoscale.strategy`|Sets the strategy to run when autoscaling is required. One of `noop`, `ec2` or `gce`.|`noop`|
+|`druid.indexer.autoscale.doAutoscale`|If set to true, autoscaling will be enabled.|false|
+|`druid.indexer.autoscale.provisionPeriod`|How often to check whether or not new Middle Managers should be added.|`PT1M`|
+|`druid.indexer.autoscale.terminatePeriod`|How often to check whether Middle Managers should be removed.|`PT5M`|
+|`druid.indexer.autoscale.originTime`|The starting reference timestamp that the terminate period increments upon.|`2012-01-01T00:55:00.000Z`|
+|`druid.indexer.autoscale.workerIdleTimeout`|How long a worker can be idle (not running a task) before it can be considered for termination.|`PT90M`|
+|`druid.indexer.autoscale.maxScalingDuration`|How long the Overlord waits for a Middle Manager to show up before giving up.|`PT15M`|
+|`druid.indexer.autoscale.numEventsToTrack`|The number of autoscaling related events (node creation and termination) to track.|10|
+|`druid.indexer.autoscale.pendingTaskTimeout`|How long a task can be in "pending" state before the Overlord tries to scale up.|`PT30S`|
+|`druid.indexer.autoscale.workerVersion`|If set, only creates nodes of the set version during autoscaling. Overrides dynamic configuration. |null|
+|`druid.indexer.autoscale.workerPort`|The port that Middle Managers will run on.|8080|
+|`druid.indexer.autoscale.workerCapacityHint`| An estimation of the number of task slots available for each worker launched by the auto scaler when there are no workers running. The auto scaler uses the worker capacity hint to launch workers with an adequate capacity to handle pending tasks. When unset or set to a value less than or equal to 0, the auto scaler scales workers equal to the value for `minNumWorkers` in autoScaler config instead. The auto scaler assumes that each worker, either a Middle Manager or indexer, has the same number of task slots. 
Therefore, when all your workers have the same capacity (homogeneous capacity), set the value for `autoscale.workerCapacityHint` equal to `druid.worker.capacity`. If your workers have different capacities (heterogeneous capacity), set the value to the average of `druid.worker.capacity` across the workers. For example, if two workers have `druid.worker.capacity=10`, and one has `druid.worker.capacity=4`, set `autoscale.workerCapacityHint=8`. Only applies to `pendingTaskBased` provisioning strategy.|-1| + +##### Supervisors + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.supervisor.healthinessThreshold`|The number of successful runs before an unhealthy supervisor is again considered healthy.|3| +|`druid.supervisor.unhealthinessThreshold`|The number of failed runs before the supervisor is considered unhealthy.|3| +|`druid.supervisor.taskHealthinessThreshold`|The number of consecutive task successes before an unhealthy supervisor is again considered healthy.|3| +|`druid.supervisor.taskUnhealthinessThreshold`|The number of consecutive task failures before the supervisor is considered unhealthy.|3| +|`druid.supervisor.storeStackTrace`|Whether full stack traces of supervisor exceptions should be stored and returned by the supervisor `/status` endpoint.|false| +|`druid.supervisor.maxStoredExceptionEvents`|The maximum number of exception events that can be returned through the supervisor `/status` endpoint.|`max(healthinessThreshold, unhealthinessThreshold)`| +|`druid.supervisor.idleConfig.enabled`|If `true`, supervisor can become idle if there is no data on input stream/topic for some time.|false| +|`druid.supervisor.idleConfig.inactiveAfterMillis`|Supervisor is marked as idle if all existing data has been read from input topic and no new data has been published for `inactiveAfterMillis` milliseconds.|`600_000`| + +The `druid.supervisor.idleConfig.*` specification in the Overlord runtime properties defines the default behavior for the entire cluster. See [Idle Configuration in Kafka Supervisor IOConfig](../ingestion/kinesis-ingestion.md#io-configuration) to override it for an individual supervisor. + +##### Segment metadata cache (Experimental) + +The following properties pertain to segment metadata caching on the Overlord that may be used to speed up segment allocation and other metadata operations. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.manager.segments.useIncrementalCache`|Denotes the usage mode of the segment metadata incremental cache. Possible modes are: (a) `never`: Cache is disabled. (b) `always`: Reads are always done from the cache. Service start-up will be blocked until cache has synced with the metadata store at least once. Transactions will block until cache has synced with the metadata store at least once after becoming leader. (c) `ifSynced`: Reads are done from the cache only if it has already synced with the metadata store. This mode does not block service start-up or transactions.|`never`| +|`druid.manager.segments.pollDuration`|Duration (in ISO 8601 format) between successive syncs of the cache with the metadata store. This property is used only when `druid.manager.segments.useIncrementalCache` is set to `always` or `ifSynced`.|`PT1M` (1 minute)| + +##### Auto-kill unused segments (Experimental) + +These configs pertain to the new embedded mode of running [kill tasks on the Overlord](../data-management/delete.md#auto-kill-data-on-the-overlord-experimental). 
+None of the configs that apply to [auto-kill performed by the Coordinator](../data-management/delete.md#auto-kill-data-using-coordinator-duties) are used by this feature. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.manager.segments.killUnused.enabled`|Boolean flag to enable auto-kill of eligible unused segments on the Overlord. This feature can be used only when [segment metadata caching](#segment-metadata-cache-experimental) is enabled on the Overlord and MUST NOT be enabled if `druid.coordinator.kill.on` is already set to `true` on the Coordinator.|`true`| +|`druid.manager.segments.killUnused.bufferPeriod`|Period after which a segment marked as unused becomes eligible for auto-kill on the Overlord. This config is effective only if `druid.manager.segments.killUnused.enabled` is set to `true`.|`P30D` (30 days)| + +#### Overlord dynamic configuration + +The Overlord has dynamic configurations to tune how Druid assigns tasks to workers. +You can configure these parameters using the [web console](../operations/web-console.md) or through the [Overlord dynamic configuration API](../api-reference/dynamic-configuration-api.md#overlord-dynamic-configuration). + +The following table shows the dynamic configuration properties for the Overlord. + +|Property|Description|Default| +|--------|-----------|-------| +|`selectStrategy`| Describes how to assign tasks to Middle Managers. The type can be `equalDistribution`, `equalDistributionWithCategorySpec`, `fillCapacity`, `fillCapacityWithCategorySpec`, and `javascript`. | `{"type":"equalDistribution"}` | +|`autoScaler`| Only used if [autoscaling](#autoscaler) is enabled.| null | + +The following is an example of an Overlord dynamic config: + +
+<details>
+<summary>Click to view the example</summary>
+
+```json
+{
+  "selectStrategy": {
+    "type": "fillCapacity",
+    "affinityConfig": {
+      "affinity": {
+        "datasource1": ["host1:port", "host2:port"],
+        "datasource2": ["host3:port"]
+      }
+    }
+  },
+  "autoScaler": {
+    "type": "ec2",
+    "minNumWorkers": 2,
+    "maxNumWorkers": 12,
+    "envConfig": {
+      "availabilityZone": "us-east-1a",
+      "nodeData": {
+        "amiId": "${AMI}",
+        "instanceType": "c3.8xlarge",
+        "minInstances": 1,
+        "maxInstances": 1,
+        "securityGroupIds": ["${IDs}"],
+        "keyName": "${KEY_NAME}"
+      },
+      "userData": {
+        "impl": "string",
+        "data": "${SCRIPT_COMMAND}",
+        "versionReplacementString": ":VERSION:",
+        "version": null
+      }
+    }
+  }
+}
+```
+</details>
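+
+You don't need to supply both fields in every update. For instance, the following minimal sketch (using placeholder `host:port` values, as in the example above) changes only the worker select strategy, setting a strong affinity so that tasks for `datasource1` wait for their preferred Middle Managers rather than run elsewhere; see [affinityConfig](#affinityconfig) below for the field details.
+
+```json
+{
+  "selectStrategy": {
+    "type": "fillCapacity",
+    "affinityConfig": {
+      "affinity": {
+        "datasource1": ["host1:port", "host2:port"]
+      },
+      "strong": true
+    }
+  }
+}
+```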
+
+
+##### Worker select strategy
+
+The select strategy controls how Druid assigns tasks to workers (Middle Managers).
+At a high level, the select strategy determines the list of eligible workers for a given task using
+either an `affinityConfig` or a `categorySpec`. Then, Druid assigns the task by either trying to distribute load equally
+(`equalDistribution`) or to fill as many workers as possible to capacity (`fillCapacity`).
+There are four options for select strategies:
+
+* [`equalDistribution`](#equaldistribution)
+* [`equalDistributionWithCategorySpec`](#equaldistributionwithcategoryspec)
+* [`fillCapacity`](#fillcapacity)
+* [`fillCapacityWithCategorySpec`](#fillcapacitywithcategoryspec)
+
+A `javascript` option is also available but should only be used for prototyping new strategies.
+
+If an `affinityConfig` is provided (as part of the `fillCapacity` and `equalDistribution` strategies) for a given task, the list of workers eligible to be assigned is determined as follows:
+
+* a non-affinity worker if no affinity is specified for that datasource. Any worker not listed in the `affinityConfig` is considered a non-affinity worker.
+* a non-affinity worker if preferred workers are not available and the affinity is _weak_, i.e. `strong: false`.
+* a preferred worker listed in the `affinityConfig` for this datasource if it has available capacity.
+* no worker if preferred workers are not available and the affinity is _strong_, i.e. `strong: true`. In this case, the task remains in "pending" state. The chosen provisioning strategy (e.g. `pendingTaskBased`) may then use the total number of pending tasks to determine if a new node should be provisioned.
+
+Note that every worker listed in the `affinityConfig` is only used for its assigned datasources and no others.
+
+If a `categorySpec` is provided (as part of the `fillCapacityWithCategorySpec` and `equalDistributionWithCategorySpec` strategies), then a task of a given datasource may be assigned to:
+
+* any worker if no category config is given for the task type
+* any worker if a category config is given for the task type but no category is given for the datasource and there's no default category
+* a preferred worker (based on the category config and the category for the datasource) if available
+* any worker if a category config and category are given but no preferred worker is available and the category config is `weak`
+* not assigned at all if preferred workers are not available and the category config is `strong`
+
+In both cases, Druid determines the list of eligible workers and selects one depending on their load, with the goal of either distributing the load equally or filling as few workers as possible.
+
+If you are using autoscaling, use the `fillCapacity` select strategy, since autoscaled nodes cannot
+be assigned a category, and you want the work to be concentrated on the fewest number of workers to allow the empty ones to scale down.
+
+###### `equalDistribution`
+
+Tasks are assigned to the Middle Manager with the most free slots at the time the task begins running.
+This evenly distributes work across your Middle Managers. 
+ +|Property|Description|Default| +|--------|-----------|-------| +|`type`|`equalDistribution`|required; must be `equalDistribution`| +|`affinityConfig`|[`AffinityConfig`](#affinityconfig) object|null (no affinity)| +|`taskLimits`|[`TaskLimits`](#tasklimits) object|null (no limits)| + +###### `equalDistributionWithCategorySpec` + +This strategy is a variant of `equalDistribution`, which supports `workerCategorySpec` field rather than `affinityConfig`. +By specifying `workerCategorySpec`, you can assign tasks to run on different categories of Middle Managers based on the **type** and **dataSource** of the task. +This strategy doesn't work with `AutoScaler` since the behavior is undefined. + +|Property|Description|Default| +|--------|-----------|-------| +|`type`|`equalDistributionWithCategorySpec`|required; must be `equalDistributionWithCategorySpec`| +|`workerCategorySpec`|[`WorkerCategorySpec`](#workercategoryspec) object|null (no worker category spec)| +|`taskLimits`|[`TaskLimits`](#tasklimits) object|null (no limits)| + +The following example shows tasks of type `index_kafka` that default to running on Middle Managers of category `c1`, except for tasks that write to datasource `ds1`, which run on Middle Managers of category `c2`. + +```json +{ + "selectStrategy": { + "type": "equalDistributionWithCategorySpec", + "workerCategorySpec": { + "strong": false, + "categoryMap": { + "index_kafka": { + "defaultCategory": "c1", + "categoryAffinity": { + "ds1": "c2" + } + } + } + } + } +} +``` + +###### `fillCapacity` + +Tasks are assigned to the worker with the most currently-running tasks. This is +useful when you are auto-scaling Middle Managers since it tends to pack some full and +leave others empty. The empty ones can be safely terminated. + +Note that if `druid.indexer.runner.pendingTasksRunnerNumThreads` is set to _N_ > 1, then this strategy will fill _N_ +Middle Managers up to capacity simultaneously, rather than a single Middle Manager. + +|Property|Description|Default| +|--------|-----------|-------| +|`type`| `fillCapacity`|required; must be `fillCapacity`| +|`affinityConfig`| [`AffinityConfig`](#affinityconfig) object |null (no affinity)| +|`taskLimits`|[`TaskLimits`](#tasklimits) object|null (no limits)| + +###### `fillCapacityWithCategorySpec` + +This strategy is a variant of `fillCapacity`, which supports `workerCategorySpec` instead of an `affinityConfig`. +The usage is the same as `equalDistributionWithCategorySpec` strategy. +This strategy doesn't work with `AutoScaler` since the behavior is undefined. + +|Property|Description|Default| +|--------|-----------|-------| +|`type`|`fillCapacityWithCategorySpec`.|required; must be `fillCapacityWithCategorySpec`| +|`workerCategorySpec`|[`WorkerCategorySpec`](#workercategoryspec) object|null (no worker category spec)| +|`taskLimits`|[`TaskLimits`](#tasklimits) object|null (no limits)| + +
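+All four strategies above also accept the optional `taskLimits` field, described under [`taskLimits`](#tasklimits) below. As a minimal sketch based on that description, the following dynamic configuration combines `equalDistribution` with limits that cap parallel indexing tasks at 3 task slots and query controllers at 25% of the total task slots:
+
+```json
+{
+  "selectStrategy": {
+    "type": "equalDistribution",
+    "taskLimits": {
+      "maxSlotCountByType": {
+        "index_parallel": 3
+      },
+      "maxSlotRatioByType": {
+        "query_controller": 0.25
+      }
+    }
+  }
+}
+```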
+
+###### `javascript`
+
+Allows defining arbitrary logic for selecting workers to run tasks using a JavaScript function.
+The function is passed the `remoteTaskRunnerConfig`, a map of `workerId` to available workers, and the task to be executed. It returns the `workerId` on which the task should be run, or null if the task cannot be run.
+It can be used for rapid development of missing features where the worker selection logic is to be changed or tuned often.
+If the selection logic is quite complex and cannot be easily tested in a JavaScript environment,
+it's better to write a Druid extension module that extends the current worker selection strategies written in Java.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`type`|`javascript`|required; must be `javascript`|
+|`function`|String representing the JavaScript function.| |
+
+The following example shows a function that sends `index_hadoop` tasks to the workers `middleManager1_hostname:8091` and `middleManager2_hostname:8091`, and all other tasks to other available workers.
+
+```json
+{
+  "type":"javascript",
+  "function":"function (config, zkWorkers, task) {\nvar batch_workers = new java.util.ArrayList();\nbatch_workers.add(\"middleManager1_hostname:8091\");\nbatch_workers.add(\"middleManager2_hostname:8091\");\nworkers = zkWorkers.keySet().toArray();\nvar sortedWorkers = new Array()\n;for(var i = 0; i < workers.length; i++){\n sortedWorkers[i] = workers[i];\n}\nArray.prototype.sort.call(sortedWorkers,function(a, b){return zkWorkers.get(b).getCurrCapacityUsed() - zkWorkers.get(a).getCurrCapacityUsed();});\nvar minWorkerVer = config.getMinWorkerVersion();\nfor (var i = 0; i < sortedWorkers.length; i++) {\n var worker = sortedWorkers[i];\n var zkWorker = zkWorkers.get(worker);\n if(zkWorker.canRunTask(task) && zkWorker.isValidVersion(minWorkerVer)){\n if(task.getType() == 'index_hadoop' && batch_workers.contains(worker)){\n return worker;\n } else {\n if(task.getType() != 'index_hadoop' && !batch_workers.contains(worker)){\n return worker;\n }\n }\n }\n}\nreturn null;\n}"
+}
+```
+
+:::info
+ JavaScript-based functionality is disabled by default. Refer to the Druid [JavaScript programming guide](../development/javascript.md) for guidelines about using Druid's JavaScript functionality, including instructions on how to enable it.
+:::
+
+###### affinityConfig
+
+Use the `affinityConfig` field to pass affinity configuration to the `equalDistribution` and `fillCapacity` strategies.
+If not provided, the default is to have no affinity.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`affinity`|JSON object mapping a datasource String name to a list of indexing service Middle Manager `host:port` values. Druid doesn't perform DNS resolution, so the 'host' value must match what is configured on the Middle Manager and what the Middle Manager announces itself as (examine the Overlord logs to see what your Middle Manager announces itself as).|`{}`|
+|`strong`|When `true`, tasks for a datasource must be assigned to affinity-mapped Middle Managers. Tasks remain queued until a slot becomes available. When `false`, Druid may assign tasks for a datasource to other Middle Managers when affinity-mapped Middle Managers are unavailable to run queued tasks.|false|
+
+###### workerCategorySpec
+
+You can provide a `workerCategorySpec` to the `equalDistributionWithCategorySpec` and `fillCapacityWithCategorySpec` strategies using the `workerCategorySpec`
+field. If not provided, the default is to not use it at all. 
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`categoryMap`|A JSON map object mapping a task type String name to a [CategoryConfig](#categoryconfig) object, by which you can specify category config for different task types.|`{}`|
+|`strong`|With a weak workerCategorySpec (the default), tasks for a dataSource may be assigned to other Middle Managers if the Middle Managers specified in `categoryMap` are not able to run all pending tasks in the queue for that dataSource. With a strong workerCategorySpec, tasks for a dataSource will only ever be assigned to their specified Middle Managers, and will wait in the pending queue if necessary.|false|
+
+###### `taskLimits`
+
+The `taskLimits` field can be used with the `equalDistribution`, `fillCapacity`, `equalDistributionWithCategorySpec`, and `fillCapacityWithCategorySpec` strategies.
+If you don't provide it, no task limits are applied by default.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`maxSlotCountByType`|A map where each key is a task type (`String`), and the corresponding value represents the absolute limit on the number of task slots that tasks of this type can occupy. The value is an `Integer` that is greater than or equal to 0. For example, a value of 5 means that tasks of this type can occupy up to 5 task slots in total. If both absolute and ratio limits are specified for the same task type, the effective limit is the smaller of the absolute limit and the limit derived from the corresponding ratio. For example, with `maxSlotCountByType = {"index_parallel": 3, "query_controller": 5}`, parallel indexing tasks can occupy up to 3 task slots, and query controllers can occupy up to 5 task slots.|`{}`|
+|`maxSlotRatioByType`|A map where each key is a task type (`String`), and the corresponding value is a `Double` in the range [0, 1], representing the ratio of task slots that tasks of this type can occupy. This ratio defines the proportion of total task slots a task type can use, calculated as `ratio * totalSlots`. If both absolute and ratio limits are specified for the same task type, the effective limit is the smaller of the absolute limit and the limit derived from the corresponding ratio. For example, with `maxSlotRatioByType = {"index_parallel": 0.5, "query_controller": 0.25}`, parallel indexing tasks can occupy up to 50% of the total task slots, and query controllers can occupy up to 25% of the total task slots.|`{}`|
+
+###### CategoryConfig
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`defaultCategory`|Specifies the default category for a task type.|null|
+|`categoryAffinity`|A JSON map object mapping a datasource String name to a category String name of the Middle Manager. If a category isn't specified for a datasource, the `defaultCategory` is used. If neither a category nor a `defaultCategory` is specified, tasks can run on any available Middle Managers.|null|
+
+##### Autoscaler
+
+Amazon's EC2 and Google's GCE are currently the only supported autoscalers. 
+ +EC2's autoscaler properties are: + +|Property| Description|Default| +|--------|------------|-------| +|`type`|`ec2`|0| +|`minNumWorkers`| The minimum number of workers that can be in the cluster at any given time.|0| +|`maxNumWorkers`| The maximum number of workers that can be in the cluster at any given time.|0| +|`envConfig.availabilityZone` | What Amazon availability zone to run in.|none| +|`envConfig.nodeData`| A JSON object that describes how to launch new nodes.|none; required| +| `envConfig.userData`| A JSON object that describes how to configure new nodes. If you have set `druid.indexer.autoscale.workerVersion`, this must have a `versionReplacementString`. Otherwise, a `versionReplacementString` is not necessary.|none; optional| + +For GCE's properties, please refer to the [gce-extensions](../development/extensions-contrib/gce-extensions.md). + +## Data server + +This section contains the configuration options for the services that reside on Data servers (Middle Managers/Peons and Historicals) in the suggested [three-server configuration](../design/architecture.md#druid-servers). + +Configuration options for the [Indexer process](../design/indexer.md) are also provided here. + +### Middle Manager and Peon + +These Middle Manager and Peon configurations can be defined in the `middleManager/runtime.properties` file. + +#### Middle Manager service config + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.host`|The host for the current service. This is used to advertise the current service location as reachable from another service and should generally be specified such that `http://${druid.host}/` could actually talk to this service|`InetAddress.getLocalHost().getCanonicalHostName()`| +|`druid.bindOnHost`|Indicating whether the service's internal jetty server bind on `druid.host`. Default is false, which means binding to all interfaces.|false| +|`druid.plaintextPort`|This is the port to actually listen on; unless port mapping is used, this will be the same port as is on `druid.host`|8091| +|`druid.tlsPort`|TLS port for HTTPS connector, if [druid.enableTlsPort](../operations/tls-support.md) is set then this config will be used. If `druid.host` contains port then that port will be ignored. This should be a non-negative Integer.|8291| +|`druid.service`|The name of the service. This is used as a dimension when emitting metrics and alerts to differentiate between the various services|`druid/middlemanager`| +|`druid.labels`|Optional JSON object of key-value pairs that define custom labels for the server. These labels are displayed in the web console under the "Services" tab. Example: `druid.labels={"location":"Airtrunk"}` or `druid.labels.location=Airtrunk`|`null`| + +#### Middle Manager configuration + +Middle Managers pass their configurations down to their child peons. 
The Middle Manager requires the following configs: + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.indexer.runner.allowedPrefixes`|Whitelist of prefixes for configs that can be passed down to child peons.|`com.metamx`, `druid`, `org.apache.druid`, `user.timezone`, `file.encoding`, `java.io.tmpdir`, `hadoop`| +|`druid.indexer.runner.compressZnodes`|Indicates whether or not the Middle Managers should compress Znodes.|true| +|`druid.indexer.runner.classpath`|Java classpath for the peon.|`System.getProperty("java.class.path")`| +|`druid.indexer.runner.javaCommand`|Command required to execute java.|java| +|`druid.indexer.runner.javaOpts`|_DEPRECATED_ A string of -X Java options to pass to the peon's JVM. Quotable parameters or parameters with spaces are encouraged to use javaOptsArray|`''`| +|`druid.indexer.runner.javaOptsArray`|A JSON array of strings to be passed in as options to the peon's JVM. This is additive to `druid.indexer.runner.javaOpts` and is recommended for properly handling arguments which contain quotes or spaces like `["-XX:OnOutOfMemoryError=kill -9 %p"]`|`[]`| +|`druid.indexer.runner.maxZnodeBytes`|The maximum size Znode in bytes that can be created in ZooKeeper, should be in the range of [10KiB, 2GiB). [Human-readable format](human-readable-byte.md) is supported.|512KiB| +|`druid.indexer.runner.startPort`|Starting port used for Peon services, should be greater than 1023 and less than 65536.|8100| +|`druid.indexer.runner.endPort`|Ending port used for Peon services, should be greater than or equal to `druid.indexer.runner.startPort` and less than 65536.|65535| +|`druid.indexer.runner.ports`|A JSON array of integers to specify ports that used for Peon services. If provided and non-empty, ports for Peon services will be chosen from these ports. And `druid.indexer.runner.startPort/druid.indexer.runner.endPort` will be completely ignored.|`[]`| +|`druid.worker.ip`|The IP of the worker.|`localhost`| +|`druid.worker.version`|Version identifier for the Middle Manager. The version number is a string. This affects the expected behavior during certain operations like comparison against `druid.indexer.runner.minWorkerVersion`. Specifically, the version comparison follows dictionary order. Use ISO8601 date format for the version to accommodate date comparisons.|0| +|`druid.worker.capacity`|Maximum number of tasks the Middle Manager can accept.|Number of CPUs on the machine - 1| +|`druid.worker.baseTaskDirs`|List of base temporary working directories, one of which is assigned per task in a round-robin fashion. This property can be used to allow usage of multiple disks for indexing. This property is recommended in place of and takes precedence over `${druid.indexer.task.baseTaskDir}`. If this configuration is not set, `${druid.indexer.task.baseTaskDir}` is used. For example, `druid.worker.baseTaskDirs=[\"PATH1\",\"PATH2\",...]`.|null| +|`druid.worker.baseTaskDirSize`|The total amount of bytes that can be used by tasks on any single task dir. This value is treated symmetrically across all directories, that is, if this is 500 GB and there are 3 `baseTaskDirs`, then each of those task directories is assumed to allow for 500 GB to be used and a total of 1.5 TB will potentially be available across all tasks. 
The actual amount of memory assigned to each task is discussed in [Configuring task storage sizes](../ingestion/tasks.md#configuring-task-storage-sizes)|`Long.MAX_VALUE`| +|`druid.worker.category`|A string to name the category that the Middle Manager node belongs to.|`_default_worker_category`| +|`druid.indexer.fork.property.druid.centralizedDatasourceSchema.enabled`| This config should be set when [Centralized Datasource Schema](#centralized-datasource-schema-experimental) feature is enabled. |false| + +#### Peon processing + +Processing properties set on the Middle Manager are passed through to Peons. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.processing.buffer.sizeBytes`|This specifies a buffer size (less than 2GiB) for the storage of intermediate results. The computation engine in both the Historical and Realtime processes will use a scratch buffer of this size to do all of their intermediate computations off-heap. Larger values allow for more aggregations in a single pass over the data while smaller values can require more passes depending on the query that is being executed. [Human-readable format](human-readable-byte.md) is supported.|auto (max 1 GiB)| +|`druid.processing.buffer.poolCacheMaxCount`|Processing buffer pool caches the buffers for later use. This is the maximum count that the cache will grow to. Note that pool can create more buffers than it can cache if necessary.|`Integer.MAX_VALUE`| +|`druid.processing.formatString`|Realtime and Historical processes use this format string to name their processing threads.|processing-%s| +|`druid.processing.numMergeBuffers`|The number of direct memory buffers available for merging query results. The buffers are sized by `druid.processing.buffer.sizeBytes`. This property is effectively a concurrency limit for queries that require merging buffers. If you are using any queries that require merge buffers (currently, just groupBy) then you should have at least two of these.|`max(2, druid.processing.numThreads / 4)`| +|`druid.processing.numThreads`|The number of processing threads to have available for parallel processing of segments. Our rule of thumb is `num_cores - 1`, which means that even under heavy load there will still be one core available to do background tasks like talking with ZooKeeper and pulling down segments. If only one core is available, this property defaults to the value `1`.|Number of cores - 1 (or 1)| +|`druid.processing.numTimeoutThreads`|The number of processing threads to have available for handling per-segment query timeouts. Setting this value to `0` removes the ability to service per-segment timeouts, irrespective of `perSegmentTimeout` query context parameter. As these threads are just servicing timers, it's recommended to set this value to some small percent (e.g. 5%) of the total query processing cores available to the peon.|0| +|`druid.processing.fifo`|Enables the processing queue to treat tasks of equal priority in a FIFO manner.|`true`| +|`druid.processing.tmpDir`|Path where temporary files created while processing a query should be stored. If specified, this configuration takes priority over the default `java.io.tmpdir` path.|path represented by `java.io.tmpdir`| +|`druid.processing.intermediaryData.storage.type`|Storage type for intermediary segments of data shuffle between native parallel index tasks.
Set to `local` to store segment files in the local storage of the Middle Manager or Indexer.
Set to `deepstore` to use configured deep storage for better fault tolerance during rolling updates. When the storage type is `deepstore`, Druid stores the data in the `shuffle-data` directory under the configured deep storage path. Druid does not support automated cleanup for the `shuffle-data` directory. You can set up cloud storage lifecycle rules for automated cleanup of data at the `shuffle-data` prefix location.|`local`| + +The amount of direct memory needed by Druid is at least +`druid.processing.buffer.sizeBytes * (druid.processing.numMergeBuffers + druid.processing.numThreads + 1)`. You can +ensure at least this amount of direct memory is available by providing `-XX:MaxDirectMemorySize=` in +`druid.indexer.runner.javaOptsArray` as documented above. + +#### Peon query configuration + +See [general query configuration](#general-query-configuration). + +#### Peon caching + +You can optionally configure caching to be enabled on the peons by setting caching configs here. + +|Property|Possible Values|Description|Default| +|--------|---------------|-----------|-------| +|`druid.realtime.cache.useCache`|true, false|Enable the cache on the realtime.|false| +|`druid.realtime.cache.populateCache`|true, false|Populate the cache on the realtime.|false| +|`druid.realtime.cache.unCacheable`|All druid query types|All query types to not cache.|`[scan]`| +|`druid.realtime.cache.maxEntrySize`|positive integer|Maximum cache entry size in bytes.|1_000_000| + +See [cache configuration](#cache-configuration) for how to configure cache settings. + +#### Additional Peon configuration + +Although Peons inherit the configurations of their parent Middle Managers, explicit child Peon configs in Middle Manager can be set by prefixing them with: + +```properties +druid.indexer.fork.property +``` + +Additional Peon configs include: + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.peon.mode`|One of `local` or `remote`. Setting this property to `local` means you intend to run the Peon as a standalone process which is not recommended.|`remote`| +|`druid.indexer.task.baseDir`|Base temporary working directory.|`System.getProperty("java.io.tmpdir")`| +|`druid.indexer.task.baseTaskDir`|Base temporary working directory for tasks.|`${druid.indexer.task.baseDir}/persistent/task`| +|`druid.indexer.task.defaultHadoopCoordinates`|Hadoop version to use with HadoopIndexTasks that do not request a particular version.|`org.apache.hadoop:hadoop-client-api:3.3.6`, `org.apache.hadoop:hadoop-client-runtime:3.3.6`| +|`druid.indexer.task.defaultRowFlushBoundary`|Highest row count before persisting to disk. Used for indexing generating tasks.|75000| +|`druid.indexer.task.directoryLockTimeout`|Wait this long for zombie Peons to exit before giving up on their replacements.|PT10M| +|`druid.indexer.task.gracefulShutdownTimeout`|Wait this long on Middle Manager restart for restorable tasks to gracefully exit.|PT5M| +|`druid.indexer.task.hadoopWorkingPath`|Temporary working directory for Hadoop tasks.|`/tmp/druid-indexing`| +|`druid.indexer.task.restoreTasksOnRestart`|If true, Middle Managers will attempt to stop tasks gracefully on shutdown and restore them on restart.|false| +|`druid.indexer.task.ignoreTimestampSpecForDruidInputSource`|If true, tasks using the [Druid input source](../ingestion/input-sources.md) will ignore the provided timestampSpec, and will use the `__time` column of the input datasource. 
This option is provided for compatibility with ingestion specs written before Druid 0.22.0.|false| +|`druid.indexer.task.storeEmptyColumns`|Boolean value for whether or not to store empty columns during ingestion. When set to true, Druid stores every column specified in the [`dimensionsSpec`](../ingestion/ingestion-spec.md#dimensionsspec). If you use string-based schemaless ingestion and don't specify any dimensions to ingest, you must also set [`includeAllDimensions`](../ingestion/ingestion-spec.md#dimensionsspec) for Druid to store empty columns.

If you set `storeEmptyColumns` to false, Druid SQL queries referencing empty columns will fail. If you intend to leave `storeEmptyColumns` disabled, you should either ingest placeholder data for empty columns or else not query on empty columns.

You can overwrite this configuration by setting `storeEmptyColumns` in the [task context](../ingestion/tasks.md#context-parameters).|true| +|`druid.indexer.task.tmpStorageBytesPerTask`|Maximum number of bytes per task to be used to store temporary files on disk. This config is generally intended for internal usage. Attempts to set it are very likely to be overwritten by the TaskRunner that executes the task, so be sure of what you expect to happen before directly adjusting this configuration parameter. The config is documented here primarily to provide an understanding of what it means if/when someone sees that it has been set. A value of -1 disables this limit. |-1| +|`druid.indexer.task.allowHadoopTaskExecution`|Determines whether the cluster allows `index_hadoop` tasks to be executed. `index_hadoop` is deprecated, and the default of false forces cluster operators to acknowledge the deprecation and consciously opt in to using `index_hadoop` with the understanding that it will be removed in the future.|false| +|`druid.indexer.server.maxChatRequests`|Maximum number of concurrent requests served by a task's chat handler. Set to 0 to disable limiting.|0| + +If the Peon is running in remote mode, there must be an Overlord up and running. Peons in remote mode can set the following configurations: + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.peon.taskActionClient.retry.minWait`|The minimum retry time to communicate with Overlord.|`PT5S`| +|`druid.peon.taskActionClient.retry.maxWait`|The maximum retry time to communicate with Overlord.|`PT1M`| +|`druid.peon.taskActionClient.retry.maxRetryCount`|The maximum number of retries to communicate with Overlord.|13 (about 10 minutes of retrying)| + +##### SegmentWriteOutMediumFactory + +When new segments are created, Druid temporarily stores some preprocessed data in buffers. +The following types of medium exist for the buffers: + +* **Temporary files** (`tmpFile`) are stored under the task working directory (see the `druid.worker.baseTaskDirs` configuration above) and thus share its mounting properties. For example, they could be backed by HDD, SSD, or memory (tmpfs). +This type of medium may do unnecessary disk I/O and requires some disk space to be available. + +* **Off-heap memory** (`offHeapMemory`) creates buffers in off-heap memory of the JVM process that is running a task. +This type of medium is preferred, but it may require you to allow the JVM to have more off-heap memory by changing the `-XX:MaxDirectMemorySize` configuration. It's not yet well understood how the required off-heap memory size relates to the size of the segments being created, but the extra off-heap memory you add shouldn't exceed the configured maximum _heap_ size (`-Xmx`) for the same JVM. + +* **On-heap memory** (`onHeapMemory`) creates buffers using the allocated heap memory of the JVM process running a task. Using on-heap memory introduces garbage collection overhead and so is not recommended in most cases. This type of medium is most helpful for tasks run on external clusters where it may be difficult to allocate and work with direct memory effectively. 
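+
+For example, if you plan to rely on the `offHeapMemory` medium described above, you would typically pair the default medium type (see the `druid.peon.defaultSegmentWriteOutMediumFactory.type` property in the table that follows) with a larger direct memory allowance passed to Peons through `druid.indexer.runner.javaOptsArray`. The following `middleManager/runtime.properties` sketch is illustrative only; the sizes are placeholders, not tuning recommendations.
+
+```properties
+# Illustrative only: use off-heap write-out buffers for segment creation
+# and raise the Peon direct memory cap to leave room for them.
+druid.peon.defaultSegmentWriteOutMediumFactory.type=offHeapMemory
+druid.indexer.runner.javaOptsArray=["-Xmx1g", "-XX:MaxDirectMemorySize=2g"]
+```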
+ +For most types of tasks, `SegmentWriteOutMediumFactory` can be configured per-task (see [Tasks](../ingestion/tasks.md) for more information), but if it's not specified for a task, or it's not supported for a particular task type, then Druid uses the value from the following configuration: + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.peon.defaultSegmentWriteOutMediumFactory.type`|`tmpFile`, `offHeapMemory`, or `onHeapMemory`|`tmpFile`| + +### Indexer + +#### Indexer process configuration + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.host`|The host for the current process. This is used to advertise the current processes location as reachable from another process and should generally be specified such that `http://${druid.host}/` could actually talk to this process|`InetAddress.getLocalHost().getCanonicalHostName()`| +|`druid.bindOnHost`|Indicating whether the process's internal jetty server bind on `druid.host`. Default is false, which means binding to all interfaces.|false| +|`druid.plaintextPort`|This is the port to actually listen on; unless port mapping is used, this will be the same port as is on `druid.host`|8091| +|`druid.tlsPort`|TLS port for HTTPS connector, if [druid.enableTlsPort](../operations/tls-support.md) is set then this config will be used. If `druid.host` contains port then that port will be ignored. This should be a non-negative Integer.|8283| +|`druid.service`|The name of the service. This is used as a dimension when emitting metrics and alerts to differentiate between the various services|`druid/indexer`| +|`druid.labels`|Optional JSON object of key-value pairs that define custom labels for the server. These labels are displayed in the web console under the "Services" tab. Example: `druid.labels={"location":"Airtrunk"}` or `druid.labels.location=Airtrunk`|`null`| + +#### Indexer general configuration + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.worker.version`|Version identifier for the Indexer.|0| +|`druid.worker.capacity`|Maximum number of tasks the Indexer can accept.|Number of available processors - 1| +|`druid.worker.baseTaskDirs`|List of base temporary working directories, one of which is assigned per task in a round-robin fashion. This property can be used to allow usage of multiple disks for indexing. This property is recommended in place of and takes precedence over `${druid.indexer.task.baseTaskDir}`. If this configuration is not set, `${druid.indexer.task.baseTaskDir}` is used. Example: `druid.worker.baseTaskDirs=[\"PATH1\",\"PATH2\",...]`.|null| +|`druid.worker.baseTaskDirSize`|The total amount of bytes that can be used by tasks on any single task dir. This value is treated symmetrically across all directories, that is, if this is 500 GB and there are 3 `baseTaskDirs`, then each of those task directories is assumed to allow for 500 GB to be used and a total of 1.5 TB will potentially be available across all tasks. The actual amount of memory assigned to each task is discussed in [Configuring task storage sizes](../ingestion/tasks.md#configuring-task-storage-sizes)|`Long.MAX_VALUE`| +|`druid.worker.globalIngestionHeapLimitBytes`|Total amount of heap available for ingestion processing. 
This is applied by automatically setting the `maxBytesInMemory` property on tasks.|Configured max JVM heap size / 6| +|`druid.worker.numConcurrentMerges`|Maximum number of segment persist or merge operations that can run concurrently across all tasks.|`druid.worker.capacity` / 2, rounded down| +|`druid.indexer.task.baseDir`|Base temporary working directory.|`System.getProperty("java.io.tmpdir")`| +|`druid.indexer.task.baseTaskDir`|Base temporary working directory for tasks.|`${druid.indexer.task.baseDir}/persistent/tasks`| +|`druid.indexer.task.defaultHadoopCoordinates`|Hadoop version to use with HadoopIndexTasks that do not request a particular version.|`org.apache.hadoop:hadoop-client-api:3.3.6`, `org.apache.hadoop:hadoop-client-runtime:3.3.6`| +|`druid.indexer.task.gracefulShutdownTimeout`|Wait this long on Indexer restart for restorable tasks to gracefully exit.|`PT5M`| +|`druid.indexer.task.hadoopWorkingPath`|Temporary working directory for Hadoop tasks.|`/tmp/druid-indexing`| +|`druid.indexer.task.restoreTasksOnRestart`|If true, the Indexer will attempt to stop tasks gracefully on shutdown and restore them on restart.|false| +|`druid.indexer.task.ignoreTimestampSpecForDruidInputSource`|If true, tasks using the [Druid input source](../ingestion/input-sources.md) will ignore the provided timestampSpec, and will use the `__time` column of the input datasource. This option is provided for compatibility with ingestion specs written before Druid 0.22.0.|false| +|`druid.indexer.task.storeEmptyColumns`|Boolean value for whether or not to store empty columns during ingestion. When set to true, Druid stores every column specified in the [`dimensionsSpec`](../ingestion/ingestion-spec.md#dimensionsspec).

If you set `storeEmptyColumns` to false, Druid SQL queries referencing empty columns will fail. If you intend to leave `storeEmptyColumns` disabled, you should either ingest placeholder data for empty columns or else not query on empty columns.

You can overwrite this configuration by setting `storeEmptyColumns` in the [task context](../ingestion/tasks.md#context-parameters).|true| +|`druid.peon.taskActionClient.retry.minWait`|The minimum retry time to communicate with Overlord.|`PT5S`| +|`druid.peon.taskActionClient.retry.maxWait`|The maximum retry time to communicate with Overlord.|`PT1M`| +|`druid.peon.taskActionClient.retry.maxRetryCount`|The maximum number of retries to communicate with Overlord.|13 (about 10 minutes of retrying)| + +#### Indexer concurrent requests + +Druid uses Jetty to serve HTTP requests. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.server.http.numThreads`|Number of threads for HTTP requests. Please see the [Indexer Server HTTP threads](../design/indexer.md#server-http-threads) documentation for more details on how the Indexer uses this configuration.|max(10, (Number of cores * 17) / 16 + 2) + 30| +|`druid.server.http.queueSize`|Size of the worker queue used by Jetty server to temporarily store incoming client connections. If this value is set and a request is rejected by jetty because queue is full then client would observe request failure with TCP connection being closed immediately with a completely empty response from server.|Unbounded| +|`druid.server.http.maxIdleTime`|The Jetty max idle time for a connection.|`PT5M`| +|`druid.server.http.enableRequestLimit`|If enabled, no requests would be queued in jetty queue and "HTTP 429 Too Many Requests" error response would be sent. |false| +|`druid.server.http.defaultQueryTimeout`|Query timeout in millis, beyond which unfinished queries will be cancelled|300000| +|`druid.server.http.gracefulShutdownTimeout`|The maximum amount of time Jetty waits after receiving shutdown signal. After this timeout the threads will be forcefully shutdown. This allows any queries that are executing to complete(Only values greater than zero are valid).|`PT30S`| +|`druid.server.http.unannouncePropagationDelay`|How long to wait for ZooKeeper unannouncements to propagate before shutting down Jetty. This is a minimum and `druid.server.http.gracefulShutdownTimeout` does not start counting down until after this period elapses.|`PT0S` (do not wait)| +|`druid.server.http.maxQueryTimeout`|Maximum allowed value (in milliseconds) for `timeout` parameter. See [query-context](../querying/query-context-reference.md) to know more about `timeout`. Query is rejected if the query context `timeout` is greater than this value. |`Long.MAX_VALUE`| +|`druid.server.http.maxRequestHeaderSize`|Maximum size of a request header in bytes. Larger headers consume more memory and can make a server more vulnerable to denial of service attacks.|8 * 1024| +|`druid.server.http.enableForwardedRequestCustomizer`|If enabled, adds Jetty ForwardedRequestCustomizer which reads X-Forwarded-* request headers to manipulate servlet request object when Druid is used behind a proxy.|false| +|`druid.server.http.allowedHttpMethods`|List of HTTP methods that should be allowed in addition to the ones required by Druid APIs. Druid APIs require GET, PUT, POST, and DELETE, which are always allowed. This option is not useful unless you have installed an extension that needs these additional HTTP methods or that adds functionality related to CORS. None of Druid's bundled extensions require these methods.|`[]`| +|`druid.server.http.contentSecurityPolicy`|Content-Security-Policy header value to set on each non-POST response. 
Setting this property to an empty string, or omitting it, both result in the default `frame-ancestors: none` being set.|`frame-ancestors 'none'`| +|`druid.server.http.uriCompliance`|Jetty `UriCompliance` mode for Druid's embedded Jetty servers. To modify, override this config with the string representation of any `UriCompliance` mode that [Jetty supports](https://javadoc.jetty.org/jetty-12/org/eclipse/jetty/http/UriCompliance.html).|LEGACY| +|`druid.server.http.enforceStrictSNIHostChecking`| If enabled, the Jetty server will enforce strict SNI host checking. This means that if a client connects to the server using TLS but does not provide an SNI hostname, or provides an SNI hostname that does not match the server's configured hostname, a request will get a 400 response. Setting this to false is not recommended in production.|true| + +#### Indexer processing resources + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.processing.buffer.sizeBytes`|This specifies a buffer size (less than 2GiB) for the storage of intermediate results. The computation engine in the Indexer processes will use a scratch buffer of this size to do all of their intermediate computations off-heap. Larger values allow for more aggregations in a single pass over the data while smaller values can require more passes depending on the query that is being executed. [Human-readable format](human-readable-byte.md) is supported.|auto (max 1GiB)| +|`druid.processing.buffer.poolCacheMaxCount`|processing buffer pool caches the buffers for later use, this is the maximum count cache will grow to. note that pool can create more buffers than it can cache if necessary.|`Integer.MAX_VALUE`| +|`druid.processing.formatString`|Indexer processes use this format string to name their processing threads.|processing-%s| +|`druid.processing.numMergeBuffers`|The number of direct memory buffers available for merging query results. The buffers are sized by `druid.processing.buffer.sizeBytes`. This property is effectively a concurrency limit for queries that require merging buffers. If you are using any queries that require merge buffers (currently, just groupBy) then you should have at least two of these.|`max(2, druid.processing.numThreads / 4)`| +|`druid.processing.numThreads`|The number of processing threads to have available for parallel processing of segments. Our rule of thumb is `num_cores - 1`, which means that even under heavy load there will still be one core available to do background tasks like talking with ZooKeeper and pulling down segments. If only one core is available, this property defaults to the value `1`.|Number of cores - 1 (or 1)| +|`druid.processing.numTimeoutThreads`|The number of processing threads to have available for handling per-segment query timeouts. Setting this value to `0` removes the ability to service per-segment timeouts, irrespective of `perSegmentTimeout` query context parameter. As these threads are just servicing timers, it's recommended to set this value to some small percent (e.g. 5%) of the total query processing cores available to the indexer.|0| +|`druid.processing.fifo`|If the processing queue should treat tasks of equal priority in a FIFO manner|`true`| +|`druid.processing.tmpDir`|Path where temporary files created while processing a query should be stored. 
If specified, this configuration takes priority over the default `java.io.tmpdir` path.|path represented by `java.io.tmpdir`| + +The amount of direct memory needed by Druid is at least +`druid.processing.buffer.sizeBytes * (druid.processing.numMergeBuffers + druid.processing.numThreads + 1)`. You can +ensure at least this amount of direct memory is available by providing `-XX:MaxDirectMemorySize=` at the command +line. + +#### Query configurations + +See [general query configuration](#general-query-configuration). + +#### Indexer caching + +You can optionally configure caching to be enabled on the Indexer by setting caching configs here. + +|Property|Possible Values|Description|Default| +|--------|---------------|-----------|-------| +|`druid.realtime.cache.useCache`|true, false|Enable the cache on the realtime.|false| +|`druid.realtime.cache.populateCache`|true, false|Populate the cache on the realtime.|false| +|`druid.realtime.cache.unCacheable`|All druid query types|All query types to not cache.|`[scan]`| +|`druid.realtime.cache.maxEntrySize`|positive integer|Maximum cache entry size in bytes.|1_000_000| + +See [cache configuration](#cache-configuration) for how to configure cache settings. + +Note that only local caches such as the `local`-type cache and `caffeine` cache are supported. If a remote cache such as `memcached` is used, it will be ignored. + +### Historical + +For general Historical service information, see [Historical](../design/historical.md). + +These Historical configurations can be defined in the `historical/runtime.properties` file. + +#### Historical service configuration + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.host`|The host for the current service. This is used to advertise the current service location as reachable from another service and should generally be specified such that `http://${druid.host}/` could actually talk to this service|`InetAddress.getLocalHost().getCanonicalHostName()`| +|`druid.bindOnHost`|Indicating whether the service's internal jetty server bind on `druid.host`. Default is false, which means binding to all interfaces.|false| +|`druid.plaintextPort`|This is the port to actually listen on; unless port mapping is used, this will be the same port as is on `druid.host`|8083| +|`druid.tlsPort`|TLS port for HTTPS connector, if [druid.enableTlsPort](../operations/tls-support.md) is set then this config will be used. If `druid.host` contains port then that port will be ignored. This should be a non-negative Integer.|8283| +|`druid.service`|The name of the service. This is used as a dimension when emitting metrics and alerts to differentiate between the various services|`druid/historical`| +|`druid.labels`|Optional JSON object of key-value pairs that define custom labels for the server. These labels are displayed in the web console under the "Services" tab. Example: `druid.labels={"location":"Airtrunk"}` or `druid.labels.location=Airtrunk`|`null`| + +#### Historical general configuration + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.server.maxSize`|The maximum number of bytes-worth of segments that the service wants assigned to it. The Coordinator service will attempt to assign segments to a Historical service only if this property is greater than the total size of segments served by it. 
Since this property defines the upper limit on the total segment size that can be assigned to a Historical, it defaults to the sum of all `maxSize` values specified within the `druid.segmentCache.locations` property. Human-readable format is supported, see [here](human-readable-byte.md). |Sum of `maxSize` values defined within `druid.segmentCache.locations`| +|`druid.server.tier`| A string to name the distribution tier that the storage service belongs to. Many of the [rules Coordinator services use](../operations/rule-configuration.md) to manage segments can be keyed on tiers. | `_default_tier` | +|`druid.server.priority`|In a tiered architecture, the priority of the tier, thus allowing control over which services are queried. Higher numbers mean higher priority. The default (no priority) works for architectures with no cross replication (tiers that have no data-storage overlap). Data centers typically have equal priority. | 0 | + +#### Storing segments + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.segmentCache.locations`|Segments assigned to a Historical service are first stored on the local file system (in a disk cache) and then served by the Historical service. These locations define where that local cache resides. This value cannot be NULL or EMPTY. Here is an example: `druid.segmentCache.locations=[{"path": "/mnt/druidSegments", "maxSize": "10k", "freeSpacePercent": 1.0}]`. `freeSpacePercent` is optional; if provided, it enforces that much free disk partition space while storing segments. It depends on the `File.getTotalSpace()` and `File.getFreeSpace()` methods, so enable it only if they work for your file system.| none | +|`druid.segmentCache.locationSelector.strategy`|The strategy used to select a location from the configured `druid.segmentCache.locations` for segment distribution. Possible values are `leastBytesUsed`, `roundRobin`, `random`, or `mostAvailableSize`. |leastBytesUsed| +|`druid.segmentCache.deleteOnRemove`|Delete segment files from cache once a service is no longer serving a segment.|true| +|`druid.segmentCache.dropSegmentDelayMillis`|How long a service delays before completely dropping a segment.|30000 (30 seconds)| +|`druid.segmentCache.infoDir`|Historical services keep track of the segments they are serving so that when the service is restarted they can reload the same segments without waiting for the Coordinator to reassign. This path defines where this metadata is kept. The directory will be created if needed.|`${first_location}/info_dir`| +|`druid.segmentCache.announceIntervalMillis`|How frequently to announce segments while segments are loading from cache. Set this value to zero to wait for all segments to be loaded before announcing.|5000 (5 seconds)| +|`druid.segmentCache.numLoadingThreads`|How many segments to drop or load concurrently from deep storage. Note that the work of loading segments involves downloading segments from deep storage, decompressing them, and loading them to a memory-mapped location, so the work is not all I/O bound. Depending on CPU and network load, you could possibly increase this config to a higher value.|max(1,Number of cores / 6)| +|`druid.segmentCache.numBootstrapThreads`|How many segments to load concurrently during Historical startup.|`druid.segmentCache.numLoadingThreads`| +|`druid.segmentCache.lazyLoadOnStart`|Whether or not to load segment columns metadata lazily during Historical startup. 
When set to true, Historical startup time will be dramatically improved by deferring segment loading until the first time that segment takes part in a query, which will incur this cost instead.|false| +|`druid.segmentCache.numThreadsToLoadSegmentsIntoPageCacheOnDownload`|Number of threads to asynchronously read segment index files into null output stream on each new segment download after the Historical service finishes bootstrapping. Recommended to set to 1 or 2 or leave unspecified to disable. See also `druid.segmentCache.numThreadsToLoadSegmentsIntoPageCacheOnBootstrap`|0| +|`druid.segmentCache.numThreadsToLoadSegmentsIntoPageCacheOnBootstrap`|Number of threads to asynchronously read segment index files into null output stream during Historical service bootstrap. This thread pool is terminated after Historical service finishes bootstrapping. Recommended to set to half of available cores. If left unspecified, `druid.segmentCache.numThreadsToLoadSegmentsIntoPageCacheOnDownload` will be used. If both configs are unspecified, this feature is disabled. Preemptively loading segments into page cache helps in the sense that later when a segment is queried, it's already in page cache and only a minor page fault needs to be triggered instead of a more costly major page fault to make the query latency more consistent. Note that loading segment into page cache just does a blind loading of segment index files and will evict any existing segments from page cache at the discretion of operating system when the total segment size on local disk is larger than the page cache usable in the RAM, which roughly equals to total available RAM in the host - druid process memory including both heap and direct memory allocated - memory used by other non druid processes on the host, so it is the user's responsibility to ensure the host has enough RAM to host all the segments to avoid random evictions to fully leverage this feature.|`druid.segmentCache.numThreadsToLoadSegmentsIntoPageCacheOnDownload`| + +In `druid.segmentCache.locations`, `freeSpacePercent` was added because the `maxSize` setting is only a theoretical limit and assumes that much space will always be available for storing segments. In case of any druid bug leading to unaccounted segment files left alone on disk or some other service writing stuff to disk, This check can start failing segment loading early before filling up the disk completely and leaving the host usable otherwise. + +In `druid.segmentCache.locationSelector.strategy`, one of `leastBytesUsed`, `roundRobin`, `random`, or `mostAvailableSize` could be specified to represent the strategy to distribute segments across multiple segment cache locations. + +|Strategy|Description| +|--------|-----------| +|`leastBytesUsed`|Selects a location which has least bytes used in absolute terms.| +|`roundRobin`|Selects a location in a round robin fashion oblivious to the bytes used or the capacity.| +|`random`|Selects a segment cache location randomly each time among the available storage locations.| +|`mostAvailableSize`|Selects a segment cache location that has most free space among the available storage locations.| + +Note that if `druid.segmentCache.numLoadingThreads` > 1, multiple threads can download different segments at the same time. In this case, with the `leastBytesUsed` strategy or `mostAvailableSize` strategy, Historicals may select a sub-optimal storage location because each decision is based on a snapshot of the storage location status of when a segment is requested to download. 
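+
+As an illustration, the following `historical/runtime.properties` sketch spreads the segment cache across two disks, keeps a free-space guard on each, and distributes segments round-robin. The paths, sizes, and percentages are placeholders, not recommendations.
+
+```properties
+# Illustrative only: two cache locations with a 5% free-space guard on each,
+# selected in round-robin order rather than by least bytes used.
+druid.segmentCache.locations=[{"path": "/disk1/druid/segments", "maxSize": "300g", "freeSpacePercent": 5.0}, {"path": "/disk2/druid/segments", "maxSize": "300g", "freeSpacePercent": 5.0}]
+druid.segmentCache.locationSelector.strategy=roundRobin
+```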
+ +#### Historical query configs + +##### Concurrent requests + +Druid uses Jetty to serve HTTP requests. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.server.http.numThreads`|Number of threads for HTTP requests.|max(10, (Number of cores * 17) / 16 + 2) + 30| +|`druid.server.http.queueSize`|Size of the worker queue used by Jetty server to temporarily store incoming client connections. If this value is set and a request is rejected by jetty because queue is full then client would observe request failure with TCP connection being closed immediately with a completely empty response from server.|Unbounded| +|`druid.server.http.maxIdleTime`|The Jetty max idle time for a connection.|`PT5M`| +|`druid.server.http.enableRequestLimit`|If enabled, no requests would be queued in jetty queue and "HTTP 429 Too Many Requests" error response would be sent. |false| +|`druid.server.http.defaultQueryTimeout`|Query timeout in millis, beyond which unfinished queries will be cancelled|300000| +|`druid.server.http.gracefulShutdownTimeout`|The maximum amount of time Jetty waits after receiving shutdown signal. After this timeout the threads will be forcefully shutdown. This allows any queries that are executing to complete(Only values greater than zero are valid).|`PT30S`| +|`druid.server.http.unannouncePropagationDelay`|How long to wait for ZooKeeper unannouncements to propagate before shutting down Jetty. This is a minimum and `druid.server.http.gracefulShutdownTimeout` does not start counting down until after this period elapses.|`PT0S` (do not wait)| +|`druid.server.http.maxQueryTimeout`|Maximum allowed value (in milliseconds) for `timeout` parameter. See [query-context](../querying/query-context-reference.md) to know more about `timeout`. Query is rejected if the query context `timeout` is greater than this value. |`Long.MAX_VALUE`| +|`druid.server.http.maxRequestHeaderSize`|Maximum size of a request header in bytes. Larger headers consume more memory and can make a server more vulnerable to denial of service attacks.|8 * 1024| +|`druid.server.http.contentSecurityPolicy`|Content-Security-Policy header value to set on each non-POST response. Setting this property to an empty string, or omitting it, both result in the default `frame-ancestors: none` being set.|`frame-ancestors 'none'`| + +##### Processing + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.processing.buffer.sizeBytes`|This specifies a buffer size (less than 2GiB), for the storage of intermediate results. The computation engine in both the Historical and Realtime processes will use a scratch buffer of this size to do all of their intermediate computations off-heap. Larger values allow for more aggregations in a single pass over the data while smaller values can require more passes depending on the query that is being executed. [Human-readable format](human-readable-byte.md) is supported.|auto (max 1GiB)| +|`druid.processing.buffer.poolCacheMaxCount`|processing buffer pool caches the buffers for later use, this is the maximum count cache will grow to. note that pool can create more buffers than it can cache if necessary.|`Integer.MAX_VALUE`| +|`druid.processing.formatString`|Realtime and Historical processes use this format string to name their processing threads.|processing-%s| +|`druid.processing.numMergeBuffers`|The number of direct memory buffers available for merging query results. The buffers are sized by `druid.processing.buffer.sizeBytes`. 
This property is effectively a concurrency limit for queries that require merging buffers. If you are using any queries that require merge buffers (currently, just groupBy) then you should have at least two of these.|`max(2, druid.processing.numThreads / 4)`| +|`druid.processing.numThreads`|The number of processing threads to have available for parallel processing of segments. Our rule of thumb is `num_cores - 1`, which means that even under heavy load there will still be one core available to do background tasks like talking with ZooKeeper and pulling down segments. If only one core is available, this property defaults to the value `1`.|Number of cores - 1 (or 1)| +|`druid.processing.numTimeoutThreads`|The number of processing threads to have available for handling per-segment query timeouts. Setting this value to `0` removes the ability to service per-segment timeouts, irrespective of `perSegmentTimeout` query context parameter. As these threads are just servicing timers, it's recommended to set this value to some small percent (e.g. 5%) of the total query processing cores available to the historical.|0| +|`druid.processing.fifo`|If the processing queue should treat tasks of equal priority in a FIFO manner|`true`| +|`druid.processing.tmpDir`|Path where temporary files created while processing a query should be stored. If specified, this configuration takes priority over the default `java.io.tmpdir` path.|path represented by `java.io.tmpdir`| + +The amount of direct memory needed by Druid is at least +`druid.processing.buffer.sizeBytes * (druid.processing.numMergeBuffers + druid.processing.numThreads + 1)`. You can +ensure at least this amount of direct memory is available by providing `-XX:MaxDirectMemorySize=` at the command +line. + +##### Historical query configuration + +See [general query configuration](#general-query-configuration). + +#### Historical caching + +You can optionally only configure caching to be enabled on the Historical by setting caching configs here. + +|Property|Possible Values|Description|Default| +|--------|---------------|-----------|-------| +|`druid.historical.cache.useCache`|true, false|Enable the cache on the Historical.|false| +|`druid.historical.cache.populateCache`|true, false|Populate the cache on the Historical.|false| +|`druid.historical.cache.unCacheable`|All druid query types|All query types to not cache.|`[scan]`| +|`druid.historical.cache.maxEntrySize`|positive integer|Maximum cache entry size in bytes.|1_000_000| + +See [cache configuration](#cache-configuration) for how to configure cache settings. + +## Query server + +This section contains the configuration options for the services that reside on Query servers (Brokers) in the suggested [three-server configuration](../design/architecture.md#druid-servers). + +Configuration options for the [Router process](../design/router.md) are also provided here. + +### Broker + +For general Broker process information, see [here](../design/broker.md). + +These Broker configurations can be defined in the `broker/runtime.properties` file. + +#### Broker process configs + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.host`|The host for the current process. 
This is used to advertise the current processes location as reachable from another process and should generally be specified such that `http://${druid.host}/` could actually talk to this process|`InetAddress.getLocalHost().getCanonicalHostName()`| +|`druid.bindOnHost`|Indicating whether the process's internal jetty server bind on `druid.host`. Default is false, which means binding to all interfaces.|false| +|`druid.plaintextPort`|This is the port to actually listen on; unless port mapping is used, this will be the same port as is on `druid.host`|8082| +|`druid.tlsPort`|TLS port for HTTPS connector, if [druid.enableTlsPort](../operations/tls-support.md) is set then this config will be used. If `druid.host` contains port then that port will be ignored. This should be a non-negative Integer.|8282| +|`druid.service`|The name of the service. This is used as a dimension when emitting metrics and alerts to differentiate between the various services|`druid/broker`| +|`druid.labels`|Optional JSON object of key-value pairs that define custom labels for the server. These labels are displayed in the web console under the "Services" tab. Example: `druid.labels={"location":"Airtrunk"}` or `druid.labels.location=Airtrunk`|`null`| + +#### Query configuration + +##### Query routing + +|Property|Possible Values|Description|Default| +|--------|---------------|-----------|-------| +|`druid.broker.balancer.type`|`random`, `connectionCount`|Determines how the broker balances connections to Historical processes. `random` choose randomly, `connectionCount` picks the process with the fewest number of active connections to|`random`| +|`druid.broker.select.tier`|`highestPriority`, `lowestPriority`, `custom`, `preferred`|If segments are cross-replicated across tiers in a cluster, you can tell the broker to prefer to select segments in a tier with a certain priority.|`highestPriority`| +|`druid.broker.select.tier.custom.priorities`|An array of integer priorities, such as `[-1, 0, 1, 2]`|Select servers in tiers with a custom priority list.|The config only has effect if `druid.broker.select.tier` is set to `custom`. If `druid.broker.select.tier` is set to `custom` but this config is not specified, the effect is the same as `druid.broker.select.tier` set to `highestPriority`. Any of the integers in this config can be ignored if there's no corresponding tiers with such priorities. Tiers with priorities explicitly specified in this config always have higher priority than those not and those not specified fall back to use `highestPriority` strategy among themselves.| +|`druid.broker.select.tier.preferred.tier`| The preferred tier name. E.g., `_default_tier` | A non-empty value that specifies the preferred tier in which historical servers will be picked up for queries. If there are not enough historical servers from the preferred tier, servers from other tiers (if there are any) will be selected. This config only has effect if `druid.broker.select.tier` is set to `preferred` | null | +|`druid.broker.select.tier.preferred.priority`| `highest`, `lowest` | If there are multiple candidates in a preferred tier, specifies the priority to pick up candidates. By default, the higher priority a historical, the higher chances it will be picked up. This config only has effect if `druid.broker.select.tier` is set to `preferred`| `highest` | + +##### Query prioritization and laning + +Laning strategies allow you to control capacity utilization for heterogeneous query workloads. 
With laning, the broker examines and classifies a query for the purpose of assigning it to a lane. Lanes have capacity limits, enforced by the broker, that can be used to ensure sufficient resources are available for other lanes or for interactive queries (with no lane), or to limit overall throughput for queries within the lane. Requests in excess of the capacity are discarded with an HTTP 429 status code. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.query.scheduler.numThreads`|Maximum number of concurrently-running queries. When this parameter is set lower than `druid.server.http.numThreads`, query requests beyond the limit are put into the Jetty request queue. This has the effect of reserving the leftover Jetty threads for non-query requests.

When this parameter is set equal to or higher than `druid.server.http.numThreads`, it has no effect.|Unbounded| +|`druid.query.scheduler.laning.strategy`|Query laning strategy to use to assign queries to a lane in order to control capacities for certain classes of queries.|`none`| +|`druid.query.scheduler.prioritization.strategy`|Query prioritization strategy to automatically assign priorities.|`manual`| + +##### Prioritization strategies + +###### Manual prioritization strategy + +With this configuration, queries are never assigned a priority automatically, but will preserve a priority manually set on the [query context](../querying/query-context-reference.md) with the `priority` key. This mode can be explicitly set by setting `druid.query.scheduler.prioritization.strategy` to `manual`. + +###### Threshold prioritization strategy + +This prioritization strategy lowers the priority of queries that cross any of a configurable set of thresholds, such as how far in the past the data is, how large of an interval a query covers, or the number of segments taking part in a query. + +This strategy can be enabled by setting `druid.query.scheduler.prioritization.strategy` to `threshold`. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.query.scheduler.prioritization.periodThreshold`|ISO duration threshold for how old data can be queried before automatically adjusting query priority.|none| +|`druid.query.scheduler.prioritization.durationThreshold`|ISO duration threshold for maximum duration a queries interval can span before the priority is automatically adjusted.|none| +|`druid.query.scheduler.prioritization.segmentCountThreshold`|Number threshold for maximum number of segments that can take part in a query before its priority is automatically adjusted.|none| +|`druid.query.scheduler.prioritization.segmentRangeThreshold`|ISO duration threshold for maximum segment range a query can span before the priority is automatically adjusted.|none| +|`druid.query.scheduler.prioritization.adjustment`|Amount to reduce the priority of queries which cross any threshold.|none| + +##### Laning strategies + +###### No laning strategy + +In this mode, queries are never assigned a lane, and the concurrent query count will only be limited by `druid.server.http.numThreads` or `druid.query.scheduler.numThreads`, if set. This is the default Druid query scheduler operating mode. Enable this strategy explicitly by setting `druid.query.scheduler.laning.strategy` to `none`. + +###### 'High/Low' laning strategy + +This laning strategy splits queries with a `priority` below zero into a `low` query lane, automatically. Queries with priority of zero (the default) or above are considered 'interactive'. The limit on `low` queries can be set to some desired percentage of the total capacity (or HTTP thread pool size), reserving capacity for interactive queries. Queries in the `low` lane are _not_ guaranteed their capacity, which may be consumed by interactive queries, but may use up to this limit if total capacity is available. + +If the `low` lane is specified in the [query context](../querying/query-context-reference.md) `lane` parameter, this will override the computed lane. + +This strategy can be enabled by setting `druid.query.scheduler.laning.strategy=hilo`. 
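+
+As an illustration, a Broker might enable this strategy with settings similar to the following sketch. The thread count and percentage are placeholders, and the `maxLowPercent` property is described in the table that follows.
+
+```properties
+# Illustrative only: reserve most capacity for interactive queries and
+# cap low-priority (priority < 0) queries at 20% of the scheduler threads.
+druid.query.scheduler.numThreads=40
+druid.query.scheduler.laning.strategy=hilo
+druid.query.scheduler.laning.maxLowPercent=20
+```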
+ +|Property|Description|Default| +|--------|-----------|-------| +|`druid.query.scheduler.laning.maxLowPercent`|Maximum percent of the smaller of `druid.server.http.numThreads` or `druid.query.scheduler.numThreads`, defining the number of HTTP threads that can be used by queries with a priority lower than 0. Value must be an integer in the range 1 to 100, and will be rounded up.|No default, must be set if using this mode| + +##### Guardrails for materialization of subqueries + +Druid stores the subquery rows in temporary tables that live in the Java heap. It is a good practice to avoid large subqueries in Druid. +Therefore, there are guardrails built into Druid to prevent queries from generating subquery results that can exhaust the heap +space. They can be set at the cluster level or modified per query as desired. +Note the following guardrails that can be set by the cluster admin to limit the subquery results: + +1. `druid.server.http.maxSubqueryRows` in the Broker's config to set a default for the entire cluster, or `maxSubqueryRows` in the query context to set an upper limit on the number of rows a subquery can generate +2. `druid.server.http.maxSubqueryBytes` in the Broker's config to set a default for the entire cluster, or `maxSubqueryBytes` in the query context to set an upper limit on the number of bytes a subquery can generate + +Limiting the subquery by bytes is an experimental feature as it materializes the results differently. + +You can configure `maxSubqueryBytes` to the following values: + +* `disabled`: The default setting. It exempts subqueries from the byte-based limit, effectively disabling this feature. +* `auto`: Druid automatically decides the optimal byte-based limit based upon the heap space available and the maximum number of concurrent queries. +* A positive long value: Manually specifies the number of bytes that the results of a single query's subqueries can occupy on the heap. + +Due to the conversion between Java objects and the Frame format, setting `maxSubqueryBytes` can become slow if the subquery starts generating +rows on the order of 10 million and above. In those scenarios, disable the `maxSubqueryBytes` setting for such queries, assess the number of rows that the subqueries generate, and override `maxSubqueryRows` to an appropriate value. + +If you choose to modify or set any of the above limits, you must also consider the heap size of all Brokers, Historicals, and task Peons that process data for the subqueries to accommodate the subquery results. +There is no formula to calculate the correct value. Trial and error is the best approach. + +###### Manual laning strategy + +This laning strategy is best suited for cases where one or more external applications that query Druid are capable of manually deciding what lane a given query should belong to. Configured with a map of lane names to percent or exact max capacities, queries with a matching `lane` parameter in the [query context](../querying/query-context-reference.md) will be subjected to those limits. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.query.scheduler.laning.lanes.{name}`|Maximum percent or exact limit of queries that can concurrently run in the defined lanes. Any number of lanes may be defined like this. The lane names 'total' and 'default' are reserved for internal use.|No default, must define at least one lane with a limit above 0. 
If `druid.query.scheduler.laning.isLimitPercent` is set to `true`, values must be integers in the range of 1 to 100.| +|`druid.query.scheduler.laning.isLimitPercent`|If set to `true`, the values set for `druid.query.scheduler.laning.lanes` will be treated as a percent of the smaller number of `druid.server.http.numThreads` or `druid.query.scheduler.numThreads`. Note that in this mode, these lane values across lanes are _not_ required to add up to, and can exceed, 100%.|`false`| + +##### Server configuration + +Druid uses Jetty to serve HTTP requests. Each query being processed consumes a single thread from `druid.server.http.numThreads`, so consider defining `druid.query.scheduler.numThreads` to a lower value in order to reserve HTTP threads for responding to health checks, lookup loading, and other non-query, (in most cases) comparatively very short-lived, HTTP requests. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.server.http.numThreads`|Number of threads for HTTP requests.|max(10, (Number of cores * 17) / 16 + 2) + 30| +|`druid.server.http.queueSize`|Size of the worker queue used by Jetty server to temporarily store incoming client connections. If this value is set and a request is rejected by jetty because queue is full then client would observe request failure with TCP connection being closed immediately with a completely empty response from server.|Unbounded| +|`druid.server.http.maxIdleTime`|The Jetty max idle time for a connection.|`PT5M`| +|`druid.server.http.enableRequestLimit`|If enabled, no requests would be queued in jetty queue and "HTTP 429 Too Many Requests" error response would be sent. |false| +|`druid.server.http.defaultQueryTimeout`|Query timeout in millis, beyond which unfinished queries will be cancelled|300000| +|`druid.server.http.maxScatterGatherBytes`|Maximum number of bytes gathered from data processes such as Historicals and realtime processes to execute a query. Queries that exceed this limit will fail. This is an advance configuration that allows to protect in case Broker is under heavy load and not utilizing the data gathered in memory fast enough and leading to OOMs. This limit can be further reduced at query time using `maxScatterGatherBytes` in the context. Note that having large limit is not necessarily bad if broker is never under heavy concurrent load in which case data gathered is processed quickly and freeing up the memory used. Human-readable format is supported, see [here](human-readable-byte.md). |`Long.MAX_VALUE`| +|`druid.server.http.maxSubqueryRows`|Maximum number of rows from all subqueries per query. Druid stores the subquery rows in temporary tables that live in the Java heap. `druid.server.http.maxSubqueryRows` is a guardrail to prevent the system from exhausting available heap. When a subquery exceeds the row limit, Druid throws a resource limit exceeded exception: "Subquery generated results beyond maximum."

It is a good practice to avoid large subqueries in Druid. However, if you choose to raise the subquery row limit, you must also increase the heap size of all Brokers, Historicals, and task Peons that process data for the subqueries to accommodate the subquery results.

There is no formula to calculate the correct value. Trial and error is the best approach.|100000| +|`druid.server.http.maxSubqueryBytes`|Maximum number of bytes from all subqueries per query. Since the results are stored on the Java heap, `druid.server.http.maxSubqueryBytes` is a guardrail like `druid.server.http.maxSubqueryRows` to prevent the heap space from exhausting. When a subquery exceeds the byte limit, Druid throws a resource limit exceeded exception. A negative value for the guardrail indicates that Druid won't guardrail by memory. This can be set to 'disabled' which disables the results from being limited via the byte limit, 'auto' which sets this value automatically taking free heap space into account, or a positive long value depicting the number of bytes per query's subqueries' results can occupy. This is an experimental feature for now as this materializes the results in a different format.|'disabled'| +|`druid.server.http.gracefulShutdownTimeout`|The maximum amount of time Jetty waits after receiving shutdown signal. After this timeout the threads will be forcefully shutdown. This allows any queries that are executing to complete(Only values greater than zero are valid).|`PT30S`| +|`druid.server.http.unannouncePropagationDelay`|How long to wait for ZooKeeper unannouncements to propagate before shutting down Jetty. This is a minimum and `druid.server.http.gracefulShutdownTimeout` does not start counting down until after this period elapses.|`PT0S` (do not wait)| +|`druid.server.http.maxQueryTimeout`|Maximum allowed value (in milliseconds) for `timeout` parameter. See [query-context](../querying/query-context-reference.md) to know more about `timeout`. Query is rejected if the query context `timeout` is greater than this value. |`Long.MAX_VALUE`| +|`druid.server.http.maxRequestHeaderSize`|Maximum size of a request header in bytes. Larger headers consume more memory and can make a server more vulnerable to denial of service attacks. |8 * 1024| +|`druid.server.http.contentSecurityPolicy`|Content-Security-Policy header value to set on each non-POST response. Setting this property to an empty string, or omitting it, both result in the default `frame-ancestors: none` being set.|`frame-ancestors 'none'`| +|`druid.server.http.enableHSTS`|If set to true, druid services will add strict transport security header `Strict-Transport-Security: max-age=63072000; includeSubDomains` to all HTTP responses|`false`| + +##### Client configuration + +Druid Brokers use an HTTP client to communicate with data servers (Historical servers and real-time tasks). This +client has the following configuration options. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.broker.http.numConnections`|Size of connection pool for the Broker to connect to Historical and real-time processes. If there are more queries than this number that all need to speak to the same process, then they will queue up.|20| +|`druid.broker.http.eagerInitialization`|Indicates that http connections from Broker to Historical and Real-time processes should be eagerly initialized. If set to true, `numConnections` connections are created upon initialization|`true`| +|`druid.broker.http.compressionCodec`|Compression codec the Broker uses to communicate with Historical and real-time processes. 
May be "gzip" or "identity".|`gzip`| +|`druid.broker.http.readTimeout`|The timeout for data reads from Historical servers and real-time tasks.|`PT15M`| +|`druid.broker.http.unusedConnectionTimeout`|The timeout for idle connections in connection pool. The connection in the pool will be closed after this timeout and a new one will be established. This timeout should be less than `druid.broker.http.readTimeout`. Set this timeout = ~90% of `druid.broker.http.readTimeout`|`PT4M`| +|`druid.broker.http.maxQueuedBytes`|Maximum number of bytes queued per query before exerting [backpressure](../operations/basic-cluster-tuning.md#broker-backpressure) on channels to the data servers.

Similar to `druid.server.http.maxScatterGatherBytes`, except that `maxQueuedBytes` triggers [backpressure](../operations/basic-cluster-tuning.md#broker-backpressure) instead of query failure. Set to zero to disable. You can override this setting by using the [`maxQueuedBytes` query context parameter](../querying/query-context-reference.md). Druid supports [human-readable](human-readable-byte.md) format. |25 MB or 2% of maximum Broker heap size, whichever is greater.|
+|`druid.broker.http.numMaxThreads`|Maximum number of I/O worker threads.|`(number of cores) * 3 / 2 + 1`|
+|`druid.broker.http.clientConnectTimeout`|The timeout (in milliseconds) for establishing client connections.|500|
+
+
+##### Retry policy
+
+The Druid Broker can optionally retry queries internally for transient errors.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.broker.retryPolicy.numTries`|Number of tries.|1|
+
+##### Processing
+
+The Broker uses processing configs for nested groupBy queries.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.processing.buffer.sizeBytes`|This specifies a buffer size (less than 2GiB) for the storage of intermediate results. The computation engine in both the Historical and Realtime processes will use a scratch buffer of this size to do all of their intermediate computations off-heap. Larger values allow for more aggregations in a single pass over the data while smaller values can require more passes depending on the query that is being executed. [Human-readable format](human-readable-byte.md) is supported.|auto (max 1GiB)|
+|`druid.processing.buffer.poolCacheInitialCount`|Initializes the number of buffers allocated in the intermediate results pool. Note that the pool can create more buffers if necessary.|`0`|
+|`druid.processing.buffer.poolCacheMaxCount`|The processing buffer pool caches buffers for later use; this is the maximum count the cache will grow to. Note that the pool can create more buffers than it can cache if necessary.|`Integer.MAX_VALUE`|
+|`druid.processing.numMergeBuffers`|The number of direct memory buffers available for merging query results. The buffers are sized by `druid.processing.buffer.sizeBytes`. This property is effectively a concurrency limit for queries that require merging buffers. If you are using any queries that require merge buffers (currently, just groupBy) then you should have at least two of these.|`max(2, druid.processing.numThreads / 4)`|
+|`druid.processing.fifo`|Whether the processing queue should treat tasks of equal priority in a FIFO manner.|`true`|
+|`druid.processing.tmpDir`|Path where temporary files created while processing a query should be stored. If specified, this configuration takes priority over the default `java.io.tmpdir` path.|path represented by `java.io.tmpdir`|
+|`druid.processing.merge.useParallelMergePool`|Enable automatic parallel merging for Brokers on a dedicated async ForkJoinPool. If `false`, merges are instead done serially on the `HTTP` thread pool.|`true`|
+|`druid.processing.merge.parallelism`|Size of the ForkJoinPool. Note that the default configuration assumes that the value returned by `Runtime.getRuntime().availableProcessors()` represents 2 hyper-threads per physical core, and multiplies this value by `0.75` in an attempt to size to `1.5` times the number of _physical_ cores.|`Runtime.getRuntime().availableProcessors() * 0.75` (rounded up)|
+|`druid.processing.merge.defaultMaxQueryParallelism`|Default maximum number of parallel merge tasks per query. 
Note that the default configuration assumes that the value returned by `Runtime.getRuntime().availableProcessors()` represents 2 hyper-threads per physical core, and multiplies this value by `0.5` in attempt to size to the number of _physical_ cores.|`Runtime.getRuntime().availableProcessors() * 0.5` (rounded up)| +|`druid.processing.merge.awaitShutdownMillis`|Time to wait for merge ForkJoinPool tasks to complete before ungracefully stopping on process shutdown in milliseconds.|`60_000`| +|`druid.processing.merge.targetRunTimeMillis`|Ideal run-time of each ForkJoinPool merge task, before forking off a new task to continue merging sequences.|100| +|`druid.processing.merge.initialYieldNumRows`|Number of rows to yield per ForkJoinPool merge task, before forking off a new task to continue merging sequences.|16384| +|`druid.processing.merge.smallBatchNumRows`|Size of result batches to operate on in ForkJoinPool merge tasks.|4096| + +The amount of direct memory needed by Druid is at least +`druid.processing.buffer.sizeBytes * (druid.processing.numMergeBuffers + 1)`. You can +ensure at least this amount of direct memory is available by providing `-XX:MaxDirectMemorySize=` at the command +line. + +##### Broker query configuration + +See [general query configuration](#general-query-configuration). + +###### Broker generated query configuration supplementation + +The Broker generates queries internally. This configuration section describes how an operator can augment the configuration +of these queries. + +As of now the only supported augmentation is overriding the default query context. This allows an operator the flexibility +to adjust it as they see fit. A common use of this configuration is to override the query priority of the cluster generated +queries in order to avoid running as a default priority of 0. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.broker.internal.query.config.context`|A string formatted `key:value` map of a query context to add to internally generated broker queries.|null| + +#### SQL + +The Druid SQL server is configured through the following properties on the Broker. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.sql.enable`|Whether to enable SQL at all, including background metadata fetching. If false, this overrides all other SQL-related properties and disables SQL metadata, serving, and planning completely.|true| +|`druid.sql.avatica.enable`|Whether to enable JDBC querying at `/druid/v2/sql/avatica/`.|true| +|`druid.sql.avatica.maxConnections`|Maximum number of open connections for the Avatica server. These are not HTTP connections, but are logical client connections that may span multiple HTTP connections.|25| +|`druid.sql.avatica.maxRowsPerFrame`|Maximum acceptable value for the JDBC client `Statement.setFetchSize` method. This setting determines the maximum number of rows that Druid will populate in a single 'fetch' for a JDBC `ResultSet`. Set this property to -1 to enforce no row limit on the server-side and potentially return the entire set of rows on the initial statement execution. If the JDBC client calls `Statement.setFetchSize` with a value other than -1, Druid uses the lesser value of the client-provided limit and `maxRowsPerFrame`. If `maxRowsPerFrame` is smaller than `minRowsPerFrame`, then the `ResultSet` size will be fixed. 
To handle queries that produce results with a large number of rows, you can increase value of `druid.sql.avatica.maxRowsPerFrame` to reduce the number of fetches required to completely transfer the result set.|5,000| +|`druid.sql.avatica.minRowsPerFrame`|Minimum acceptable value for the JDBC client `Statement.setFetchSize` method. The value for this property must greater than 0. If the JDBC client calls `Statement.setFetchSize` with a lesser value, Druid uses `minRowsPerFrame` instead. If `maxRowsPerFrame` is less than `minRowsPerFrame`, Druid uses the minimum value of the two. For handling queries which produce results with a large number of rows, you can increase this value to reduce the number of fetches required to completely transfer the result set.|100| +|`druid.sql.avatica.maxStatementsPerConnection`|Maximum number of simultaneous open statements per Avatica client connection.|4| +|`druid.sql.avatica.connectionIdleTimeout`|Avatica client connection idle timeout.|`PT5M`| +|`druid.sql.avatica.fetchTimeoutMs`|Avatica fetch timeout, in milliseconds. When a request for the next batch of data takes longer than this time, Druid returns an empty result set, causing the client to poll again. This avoids HTTP timeouts for long-running queries. The default of 5 sec. is good for most cases. |5000| +|`druid.sql.http.enable`|Whether to enable JSON over HTTP querying at `/druid/v2/sql/`.|true| +|`druid.sql.planner.maxTopNLimit`|Maximum threshold for a [TopN query](../querying/topnquery.md). Higher limits will be planned as [GroupBy queries](../querying/groupbyquery.md) instead.|100000| +|`druid.sql.planner.metadataRefreshPeriod`|Throttle for metadata refreshes.|`PT1M`| +|`druid.sql.planner.metadataColumnTypeMergePolicy`|Defines how column types will be chosen when faced with differences between segments when computing the SQL schema. Options are specified as a JSON object, with valid choices of `leastRestrictive` or `latestInterval`. For `leastRestrictive`, Druid will automatically widen the type computed for the schema to a type which data across all segments can be converted into, however planned schema migrations can only take effect once all segments have been re-ingested to the new schema. With `latestInterval`, the column type in most recent time chunks defines the type for the schema. |`leastRestrictive`| +|`druid.sql.planner.useApproximateCountDistinct`|Whether to use an approximate cardinality algorithm for `COUNT(DISTINCT foo)`.|true| +|`druid.sql.planner.useGroupingSetForExactDistinct`|Only relevant when `useApproximateCountDistinct` is disabled. If set to true, exact distinct queries are re-written using grouping sets. Otherwise, exact distinct queries are re-written using joins. This should be set to true for group by query with multiple exact distinct aggregations. This flag can be overridden per query.|false| +|`druid.sql.planner.useApproximateTopN`|Whether to use approximate [TopN queries](../querying/topnquery.md) when a SQL query could be expressed as such. If false, exact [GroupBy queries](../querying/groupbyquery.md) will be used instead.|true| +|`druid.sql.planner.useLexicographicTopN`|Whether to use [TopN queries](../querying/topnquery.md) with lexicographic dimension ordering. If false, [GroupBy queries](../querying/groupbyquery.md) will be used instead for lexicographic ordering. 
When both this and `useApproximateTopN` are false, TopN queries are never used.|false| +|`druid.sql.planner.requireTimeCondition`|Whether to require SQL to have filter conditions on `__time` column so that all generated native queries will have user specified intervals. If true, all queries without filter condition on `__time` column will fail|false| +|`druid.sql.planner.sqlTimeZone`|Sets the default time zone for the server, which will affect how time functions and timestamp literals behave. Should be a time zone name like "America/Los_Angeles" or offset like "-08:00".|UTC| +|`druid.sql.planner.metadataSegmentCacheEnable`|Whether to keep a cache of published segments in broker. If true, broker polls coordinator in background to get segments from metadata store and maintains a local cache. If false, coordinator's REST API will be invoked when broker needs published segments info.|false| +|`druid.sql.planner.metadataSegmentPollPeriod`|How often to poll coordinator for published segments list if `druid.sql.planner.metadataSegmentCacheEnable` is set to true. Poll period is in milliseconds. |60000| +|`druid.sql.planner.authorizeSystemTablesDirectly`|If true, Druid authorizes queries against any of the system schema tables (`sys` in SQL) as `SYSTEM_TABLE` resources which require `READ` access, in addition to permissions based content filtering.|false| +|`druid.sql.planner.useNativeQueryExplain`|If true, `EXPLAIN PLAN FOR` will return the explain plan as a JSON representation of equivalent native query(s), else it will return the original version of explain plan generated by Calcite. It can be overridden per query with `useNativeQueryExplain` context key.|true| +|`druid.sql.planner.maxNumericInFilters`|Max limit for the amount of numeric values that can be compared for a string type dimension when the entire SQL WHERE clause of a query translates to an [OR](../querying/filters.md#or) of [Bound filter](../querying/filters.md#bound-filter). By default, Druid does not restrict the amount of numeric Bound Filters on String columns, although this situation may block other queries from running. Set this property to a smaller value to prevent Druid from running queries that have prohibitively long segment processing times. The optimal limit requires some trial and error; we recommend starting with 100. Users who submit a query that exceeds the limit of `maxNumericInFilters` should instead rewrite their queries to use strings in the `WHERE` clause instead of numbers. For example, `WHERE someString IN (‘123’, ‘456’)`. If this value is disabled, `maxNumericInFilters` set through query context is ignored.|`-1` (disabled)| +|`druid.sql.approxCountDistinct.function`|Implementation to use for the [`APPROX_COUNT_DISTINCT` function](../querying/sql-aggregations.md). Without extensions loaded, the only valid value is `APPROX_COUNT_DISTINCT_BUILTIN` (a HyperLogLog, or HLL, based implementation). If the [DataSketches extension](../development/extensions-core/datasketches-extension.md) is loaded, this can also be `APPROX_COUNT_DISTINCT_DS_HLL` (alternative HLL implementation) or `APPROX_COUNT_DISTINCT_DS_THETA`.

Theta sketches use significantly more memory than HLL sketches, so you should prefer one of the two HLL implementations.|`APPROX_COUNT_DISTINCT_BUILTIN`| + +:::info + Previous versions of Druid had properties named `druid.sql.planner.maxQueryCount` and `druid.sql.planner.maxSemiJoinRowsInMemory`. + These properties are no longer available. Since Druid 0.18.0, you can use `druid.server.http.maxSubqueryRows` to control the maximum + number of rows permitted across all subqueries. +::: + +#### Broker caching + +You can optionally only configure caching to be enabled on the Broker by setting caching configs here. + +|Property|Possible Values|Description|Default| +|--------|---------------|-----------|-------| +|`druid.broker.cache.useCache`|true, false|Enable the cache on the Broker.|false| +|`druid.broker.cache.populateCache`|true, false|Populate the cache on the Broker.|false| +|`druid.broker.cache.useResultLevelCache`|true, false|Enable result level caching on the Broker.|false| +|`druid.broker.cache.populateResultLevelCache`|true, false|Populate the result level cache on the Broker.|false| +|`druid.broker.cache.resultLevelCacheLimit`|positive integer|Maximum size of query response that can be cached.|`Integer.MAX_VALUE`| +|`druid.broker.cache.unCacheable`|All druid query types|All query types to not cache.|`[scan]`| +|`druid.broker.cache.cacheBulkMergeLimit`|positive integer or 0|Queries with more segments than this number will not attempt to fetch from cache at the broker level, leaving potential caching fetches (and cache result merging) to the Historicals|`Integer.MAX_VALUE`| +|`druid.broker.cache.maxEntrySize`|positive integer|Maximum cache entry size in bytes.|1_000_000| + +See [cache configuration](#cache-configuration) for how to configure cache settings. + +:::info + Note: Even if cache is enabled, for [groupBy](../querying/groupbyquery.md) queries, segment level cache does not work on Brokers. + See [Query caching](../querying/caching.md) for more information. +::: + +#### Segment discovery + +|Property|Possible Values|Description|Default| +|--------|---------------|-----------|-------| +|`druid.serverview.type`|batch or http|Segment discovery method to use. "http" enables discovering segments using HTTP instead of ZooKeeper.|http| +|`druid.broker.segment.watchedTiers`|List of strings|The Broker watches segment announcements from processes that serve segments to build a cache to relate each process to the segments it serves. This configuration allows the Broker to only consider segments being served from a list of tiers. By default, Broker considers all tiers. This can be used to partition your dataSources in specific Historical tiers and configure brokers in partitions so that they are only queryable for specific dataSources. This config is mutually exclusive from `druid.broker.segment.ignoredTiers` and at most one of these can be configured on a Broker.|none| +|`druid.broker.segment.ignoredTiers`|List of strings|The Broker watches segment announcements from processes that serve segments to build a cache to relate each process to the segments it serves. This configuration allows the Broker to ignore the segments being served from a list of tiers. By default, Broker considers all tiers. 
This config is mutually exclusive from `druid.broker.segment.watchedTiers` and at most one of these can be configured on a Broker.|none| +|`druid.broker.segment.watchedDataSources`|List of strings|Broker watches the segment announcements from processes serving segments to build cache of which process is serving which segments, this configuration allows to only consider segments being served from a whitelist of dataSources. By default, Broker would consider all datasources. This can be used to configure brokers in partitions so that they are only queryable for specific dataSources.|none| +|`druid.broker.segment.watchRealtimeTasks`|Boolean|The Broker watches segment announcements from processes that serve segments to build a cache to relate each process to the segments it serves. When `watchRealtimeTasks` is true, the Broker watches for segment announcements from both Historicals and realtime processes. To configure a broker to exclude segments served by realtime processes, set `watchRealtimeTasks` to false. |true| +|`druid.broker.segment.awaitInitializationOnStart`|Boolean|Whether the Broker will wait for its view of segments to fully initialize before starting up. If set to 'true', the Broker's HTTP server will not start up, and the Broker will not announce itself as available, until the server view is initialized. See also `druid.sql.planner.awaitInitializationOnStart`, a related setting.|true| + +## Metrics monitors + +You can configure Druid services to emit [metrics](../operations/metrics.md) regularly from a number of [monitors](#metrics-monitors-for-each-service) via [emitters](#metrics-emitters). The following table lists general configurations for metrics: + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.monitoring.emissionPeriod`| Frequency that Druid emits metrics.|`PT1M`| +|[`druid.monitoring.monitors`](#metrics-monitors-for-each-service)|Sets list of Druid monitors used by a service.|none (no monitors)| +|[`druid.emitter`](#metrics-emitters)|Setting this value initializes one of the emitter modules.|`noop` (metric emission disabled by default)| + +### Metrics monitors for each service + +Metric monitoring is an essential part of Druid operations. +Monitors can be enabled by configuring the property `druid.monitoring.monitors` in the common configuration file, `common.runtime.properties`. +If a monitor is not supported on a certain service, it will simply be ignored while starting up that service. + +The following table lists available monitors and the respective services where they are supported: + +|Name|Description|Service| +|----|-----------|-------| +|`org.apache.druid.client.cache.CacheMonitor`|Emits metrics (to logs) about the segment results cache for Historical and Broker services. 
Reported statistics include hits, misses, rates, and size (bytes and number of entries), as well as timeouts and errors.|Broker, Historical, Indexer, Peon|
+|`org.apache.druid.java.util.metrics.OshiSysMonitor`|Reports on various system activities and statuses using [OSHI](https://github.com/oshi/oshi), a JNA-based (native) Operating System and Hardware Information library for Java.|Any|
+|`org.apache.druid.java.util.metrics.JvmMonitor`|Reports various JVM-related statistics.|Any|
+|`org.apache.druid.java.util.metrics.JvmCpuMonitor`|Reports statistics of CPU consumption by the JVM.|Any|
+|`org.apache.druid.java.util.metrics.CpuAcctDeltaMonitor`|Reports consumed CPU as per the cpuacct cgroup.|Any|
+|`org.apache.druid.java.util.metrics.JvmThreadsMonitor`|Reports thread statistics for the JVM, such as the number of total, daemon, started, and died threads.|Any|
+|`org.apache.druid.java.util.metrics.CgroupCpuMonitor`|Reports CPU shares and quotas as per the `cpu` cgroup.|Any|
+|`org.apache.druid.java.util.metrics.CgroupCpuSetMonitor`|Reports CPU core/HT and memory node allocations as per the `cpuset` cgroup.|Any|
+|`org.apache.druid.java.util.metrics.CgroupDiskMonitor`|Reports disk statistics as per the blkio cgroup.|Any|
+|`org.apache.druid.java.util.metrics.CgroupMemoryMonitor`|Reports memory statistics as per the memory cgroup.|Any|
+|`org.apache.druid.java.util.metrics.CgroupV2CpuMonitor`| **EXPERIMENTAL** Reports CPU usage from the `cpu.stat` file. Only applicable to `cgroupv2`.|Any|
+|`org.apache.druid.java.util.metrics.CgroupV2DiskMonitor`| **EXPERIMENTAL** Reports disk usage from the `io.stat` file. Only applicable to `cgroupv2`.|Any|
+|`org.apache.druid.java.util.metrics.CgroupV2MemoryMonitor`| **EXPERIMENTAL** Reports memory usage from the `memory.current` and `memory.max` files. Only applicable to `cgroupv2`.|Any|
+|`org.apache.druid.server.metrics.HistoricalMetricsMonitor`|Reports statistics on Historical services.|Historical|
+|`org.apache.druid.server.metrics.SegmentStatsMonitor`| **EXPERIMENTAL** Reports statistics about segments on Historical services. Not to be used when lazy loading is configured.|Historical|
+|`org.apache.druid.server.metrics.QueryCountStatsMonitor`|Reports how many queries have been successful/failed/interrupted.|Broker, Historical, Router, Indexer, Peon|
+|`org.apache.druid.server.metrics.SubqueryCountStatsMonitor`|Reports how many subqueries have been materialized as rows or bytes, and various other statistics related to subquery execution.|Broker|
+|`org.apache.druid.server.emitter.HttpEmittingMonitor`|Reports internal metrics of the `http` or `parametrized` emitter (see below). Must not be used with another emitter type. See the description of the metrics here: https://github.com/apache/druid/pull/4973.|Any|
+|`org.apache.druid.server.metrics.TaskCountStatsMonitor`|Reports how many ingestion tasks are currently running/pending/waiting and also the number of successful/failed tasks per emission period.|Overlord|
+|`org.apache.druid.server.metrics.TaskSlotCountStatsMonitor`|Reports metrics about task slot usage per emission period.|Overlord|
+|`org.apache.druid.server.metrics.WorkerTaskCountStatsMonitor`|Reports how many ingestion tasks are currently running/pending/waiting, the number of successful/failed tasks, and metrics about task slot usage for the reporting worker, per emission period. 
|MiddleManager, Indexer|
+|`org.apache.druid.server.metrics.ServiceStatusMonitor`|Reports a heartbeat for the service.|Any|
+|`org.apache.druid.server.metrics.GroupByStatsMonitor`|Reports metrics for groupBy queries, such as disk and merge buffer utilization.|Broker, Historical, Indexer, Peon|
+
+For example, if you only wanted monitors on all services for system and JVM information, you'd add the following to `common.runtime.properties`:
+
+```properties
+druid.monitoring.monitors=["org.apache.druid.java.util.metrics.OshiSysMonitor","org.apache.druid.java.util.metrics.JvmMonitor"]
+```
+
+All the services in your Druid deployment would have these two monitors.
+
+If you want any service-specific monitors, you must add all the monitors you want to run for that service to the service's `runtime.properties` file, even if they are listed in the common file. The service-specific properties take precedence.
+
+The following example adds the `TaskCountStatsMonitor` and `TaskSlotCountStatsMonitor` as well as the `OshiSysMonitor` and `JvmMonitor` from the previous example to the Overlord service (`coordinator-overlord/runtime.properties`):
+
+```properties
+druid.monitoring.monitors=["org.apache.druid.server.metrics.TaskCountStatsMonitor", "org.apache.druid.server.metrics.TaskSlotCountStatsMonitor", "org.apache.druid.java.util.metrics.OshiSysMonitor","org.apache.druid.java.util.metrics.JvmMonitor"]
+```
+
+If you don't include `OshiSysMonitor` and `JvmMonitor` in the Overlord's `runtime.properties` file, the monitors don't get loaded onto the Overlord despite being specified in the common file.
+
+### Metrics emitters
+
+There are several emitters available:
+
+* `noop` (default) disables metric emission.
+* [`logging`](#logging-emitter-module) emits logs using Log4j2.
+* [`http`](#http-emitter-module) sends `POST` requests of JSON events.
+* [`parametrized`](#parametrized-http-emitter-module) operates like the `http` emitter but fine-tunes the recipient URL based on the event feed.
+* [`composing`](#composing-emitter-module) initializes multiple emitter modules.
+* [`graphite`](#graphite-emitter) emits metrics to a [Graphite](https://graphiteapp.org/) Carbon service.
+* [`switching`](#switching-emitter) initializes and emits to multiple emitter modules based on the event feed.
+
+#### Logging emitter module
+
+To use this emitter module, set `druid.emitter=logging`. The `logging` emitter uses a Log4j2 logger named by
+`druid.emitter.logging.loggerClass` to emit events. Each event is logged as a single `json` object with a
+[Marker](https://logging.apache.org/log4j/2.x/manual/markers.html) as the feed of the event. Users may wish to edit the
+log4j config to route these logs to different sources based on the feed of the event.
+
+|Property|Description| Default|
+|--------|-----------|--------|
+|`druid.emitter.logging.loggerClass`|The class used for logging.|`org.apache.druid.java.util.emitter.core.LoggingEmitter`|
+|`druid.emitter.logging.logLevel`|Choices: debug, info, warn, error. The log level at which messages are logged.|info|
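+
+For example, a minimal sketch that routes all metric events through the logging emitter at the default `info` level:
+
+```properties
+# Emit metric events through Log4j2 instead of disabling emission.
+druid.emitter=logging
+druid.emitter.logging.logLevel=info
+```
+
+Unless you route the emitter's feed elsewhere in your Log4j2 configuration, these events appear in the regular service logs.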
+
+#### HTTP emitter module
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.emitter.http.flushMillis`|How often the internal message buffer is flushed (data is sent).|60000|
+|`druid.emitter.http.flushCount`|How many messages the internal message buffer can hold before flushing (sending).|500|
+|`druid.emitter.http.basicAuthentication`|[Password Provider](../operations/password-provider.md) for providing login and password for authentication in `"login:password"` form. For example, `druid.emitter.http.basicAuthentication=admin:adminpassword` uses the Default Password Provider, which allows plain text passwords.|not specified = no authentication|
+|`druid.emitter.http.flushTimeOut`|The timeout after which an event should be sent to the endpoint, even if internal buffers are not filled, in milliseconds.|not specified = no timeout|
+|`druid.emitter.http.batchingStrategy`|The strategy of how the batch is formatted. "ARRAY" means `[event1,event2]`, "NEWLINES" means `event1\nevent2`, "ONLY_EVENTS" means `event1event2`.|ARRAY|
+|`druid.emitter.http.maxBatchSize`|The maximum batch size, in bytes.|the minimum of (10% of JVM heap size divided by 2) or 5242880 (i.e., 5 MiB)|
+|`druid.emitter.http.batchQueueSizeLimit`|The maximum number of batches in the emitter queue, if there are problems with emitting.|the maximum of (2) or (10% of the JVM heap size divided by 5MiB)|
+|`druid.emitter.http.minHttpTimeoutMillis`|If the timeout implied by the speed at which batches fill up is smaller than this value, the emitter does not even try to send the batch to the endpoint, because the send would likely fail to keep up with the data. Configure this based on the `emitter/successfulSending/minTimeMs` metric. Reasonable values are 10ms to 100ms.|0|
+|`druid.emitter.http.recipientBaseUrl`|The base URL to emit messages to. Druid will POST JSON to be consumed at the HTTP endpoint specified by this property.|none, required config|
+
+#### HTTP emitter module TLS overrides
+
+By default, when sending events to a TLS-enabled receiver, the HTTP Emitter uses an SSLContext obtained from the service described at [Druid's internal communication over TLS](../operations/tls-support.md), that is, the same SSLContext that would be used for internal communications between Druid services.
+
+In some use cases it may be desirable to have the HTTP Emitter use its own separate truststore configuration. For example, there may be organizational policies that prevent the TLS-enabled metrics receiver's certificate from being added to the same truststore used by Druid's internal HTTP client.
+
+The following properties allow the HTTP Emitter to use its own truststore configuration when building its SSLContext.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.emitter.http.ssl.useDefaultJavaContext`|If set to true, the HttpEmitter will use `SSLContext.getDefault()`, the default Java SSLContext, and all other properties below are ignored.|false|
+|`druid.emitter.http.ssl.trustStorePath`|The file path or URL of the TLS/SSL Key store where trusted root certificates are stored. If this is unspecified, the HTTP Emitter uses the same SSLContext as Druid's internal HTTP client, as described at the beginning of this section, and all other properties below are ignored.|null|
+|`druid.emitter.http.ssl.trustStoreType`|The type of the key store where trusted root certificates are stored.|`java.security.KeyStore.getDefaultType()`|
+|`druid.emitter.http.ssl.trustStoreAlgorithm`|Algorithm to be used by the TrustManager to validate certificate chains.|`javax.net.ssl.TrustManagerFactory.getDefaultAlgorithm()`|
+|`druid.emitter.http.ssl.trustStorePassword`|The [Password Provider](../operations/password-provider.md) or String password for the Trust Store.|none|
+|`druid.emitter.http.ssl.protocol`|TLS protocol to use.|"TLSv1.2"|
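+
+Putting these pieces together, a minimal sketch of an `http` emitter configuration might look like the following. The recipient URL is a placeholder for your own metrics collector:
+
+```properties
+# Send metric events as JSON POST requests to an external collector.
+druid.emitter=http
+druid.emitter.http.recipientBaseUrl=http://metrics-collector.example.com:8080/druid
+# Optional: flush the buffer at least once a minute or every 500 events (the defaults).
+druid.emitter.http.flushMillis=60000
+druid.emitter.http.flushCount=500
+```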
+
+#### Parametrized HTTP emitter module
+
+The parametrized emitter takes the same configs as the [`http` emitter](#http-emitter-module) using the prefix `druid.emitter.parametrized.httpEmitting.`.
+For example:
+
+* `druid.emitter.parametrized.httpEmitting.flushMillis`
+* `druid.emitter.parametrized.httpEmitting.flushCount`
+* `druid.emitter.parametrized.httpEmitting.ssl.trustStorePath`
+
+Do not specify `recipientBaseUrl` with the parametrized emitter.
+Instead use `recipientBaseUrlPattern` described in the table below.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.emitter.parametrized.recipientBaseUrlPattern`|The URL pattern to send an event to, based on the event's feed. For example, `http://foo.bar/{feed}` sends an event to `http://foo.bar/metrics` if the event's feed is "metrics".|none, required config|
+
+#### Composing emitter module
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.emitter.composing.emitters`|List of emitter modules to load, such as ["logging","http"].|[]|
+
+#### Graphite emitter
+
+To use Graphite as the emitter, set `druid.emitter=graphite`. For configuration details, see [Graphite emitter](../development/extensions-contrib/graphite.md) for the Graphite emitter Druid extension.
+
+#### Switching emitter
+
+To use the switching emitter, set `druid.emitter=switching`.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.emitter.switching.emitters`|JSON map of feed to list of emitter modules that will be used for the mapped feed, such as `{"metrics":["http"], "alerts":["logging"]}`|{}|
+|`druid.emitter.switching.defaultEmitters`|JSON list of emitter modules to load that will be used if there is no emitter specifically designated for that event's feed, such as `["logging","http"]`.|[]|
+
+
+## Cache configuration
+
+This section describes caching configuration that is common to Broker, Historical, and Middle Manager/Peon processes.
+
+Caching can optionally be enabled on the Broker, Historical, and Middle Manager/Peon processes. See
+[Broker](#broker-caching), [Historical](#historical-caching), and [Peon](#peon-caching) configuration options for how to
+enable it for different processes.
+
+Druid uses a local in-memory cache by default, unless a different type of cache is specified.
+Use the `druid.cache.type` configuration to set a different kind of cache.
+
+Cache settings are set globally, so the same configuration can be re-used
+for both Broker and Historical processes, when defined in the common properties file.
+
+### Cache type
+
+|Property|Possible Values|Description|Default|
+|--------|---------------|-----------|-------|
+|`druid.cache.type`|`local`, `memcached`, `hybrid`, `caffeine`|The type of cache to use for queries. See below for the configuration options for each cache type.|`caffeine`|
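+
+For example, a sketch that enables segment-level and result-level caching on the Broker with the default Caffeine cache; the cache size shown is illustrative:
+
+```properties
+# Use the default in-heap Caffeine cache, capped at 256 MiB.
+druid.cache.type=caffeine
+druid.cache.sizeInBytes=256MiB
+# Enable query and result-level caching on the Broker.
+druid.broker.cache.useCache=true
+druid.broker.cache.populateCache=true
+druid.broker.cache.useResultLevelCache=true
+druid.broker.cache.populateResultLevelCache=true
+```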
+
+#### Local cache
+
+:::info
+ DEPRECATED: Use caffeine (default as of v0.12.0) instead
+:::
+
+The local cache is deprecated in favor of the Caffeine cache, and may be removed in a future version of Druid. The Caffeine cache affords significantly better performance and control over eviction behavior compared to the `local` cache, and is recommended in any situation where you are using JRE 8u60 or higher.
+
+A simple in-memory LRU cache. The local cache resides in JVM heap memory, so if you enable it, make sure you increase the heap size accordingly.
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.cache.sizeInBytes`|Maximum cache size in bytes. Zero disables caching.|0|
+|`druid.cache.initialSize`|Initial size of the hash table backing the cache.|500000|
+|`druid.cache.logEvictionCount`|If non-zero, log cache eviction every `logEvictionCount` items.|0|
+
+#### Caffeine cache
+
+A highly performant local cache implementation for Druid based on [Caffeine](https://github.com/ben-manes/caffeine). Requires JRE 8u60 or higher if using `COMMON_FJP`.
+
+##### Configuration
+
+The following table shows the configuration options known to this module:
+
+|`runtime.properties`|Description|Default|
+|--------------------|-----------|-------|
+|`druid.cache.type`|Set this to `caffeine` or leave the parameter out.|`caffeine`|
+|`druid.cache.sizeInBytes`|The maximum size of the cache in bytes on heap. It can be configured as described [here](human-readable-byte.md).|min(1GiB, Runtime.maxMemory / 10)|
+|`druid.cache.expireAfter`|The time (in ms) after an access after which a cache entry may be expired.|None (no time limit)|
+|`druid.cache.cacheExecutorFactory`|The executor factory to use for Caffeine maintenance. One of `COMMON_FJP`, `SINGLE_THREAD`, or `SAME_THREAD`.|ForkJoinPool common pool (`COMMON_FJP`)|
+|`druid.cache.evictOnClose`|Whether the close of a namespace (for example, removing a segment from a process) should cause an eager eviction of associated cache values.|`false`|
+
+##### `druid.cache.cacheExecutorFactory`
+
+The following are the possible values for `druid.cache.cacheExecutorFactory`, which controls how maintenance tasks are run:
+
+* `COMMON_FJP` (default): use the common ForkJoinPool. Use with [JRE 8u60 or higher](https://github.com/apache/druid/pull/4810#issuecomment-329922810). Older versions of the JRE may have worse performance than newer JRE versions.
+* `SINGLE_THREAD`: use a single-threaded executor.
+* `SAME_THREAD`: cache maintenance is done eagerly.
+
+##### Metrics
+
+In addition to the normal cache metrics, the Caffeine cache implementation also reports the following in both `total` and `delta`:
+
+|Metric|Description|Normal value|
+|------|-----------|------------|
+|`query/cache/caffeine/*/requests`|Count of hits or misses.|hit + miss|
+|`query/cache/caffeine/*/loadTime`|Length of time Caffeine spends loading new values (unused feature).|0|
+|`query/cache/caffeine/*/evictionBytes`|Size in bytes that have been evicted from the cache.|Varies; tune `sizeInBytes` so that `sizeInBytes`/`evictionBytes` is approximately the rate of cache churn you desire.|
+
+#### Memcached
+
+Uses memcached as the cache backend. This allows all processes to share the same cache. 
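+
+For example, a sketch that points all services at a shared Memcached cluster, using the properties described below; the hostnames and port are placeholders:
+
+```properties
+# Share one Memcached cluster across all services.
+druid.cache.type=memcached
+# Comma-separated host:port pairs of the Memcached nodes.
+druid.cache.hosts=memcached1.example.com:11211,memcached2.example.com:11211
+```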
+ +|Property|Description|Default| +|--------|-----------|-------| +|`druid.cache.expiration`|Memcached [expiration time](https://code.google.com/p/memcached/wiki/NewCommands#Standard_Protocol).|2592000 (30 days)| +|`druid.cache.timeout`|Maximum time in milliseconds to wait for a response from Memcached.|500| +|`druid.cache.hosts`|Comma separated list of Memcached hosts ``. Need to specify all nodes when `druid.cache.clientMode` is set to static. Dynamic mode [automatically identifies nodes in your cluster](https://docs.aws.amazon.com/AmazonElastiCache/latest/mem-ug/AutoDiscovery.html) so just specifying the configuration endpoint and port is fine.|none| +|`druid.cache.maxObjectSize`|Maximum object size in bytes for a Memcached object.|52428800 (50 MiB)| +|`druid.cache.memcachedPrefix`|Key prefix for all keys in Memcached.|druid| +|`druid.cache.numConnections`| Number of memcached connections to use.|1| +|`druid.cache.protocol`| Memcached communication protocol. Can be binary or text.|binary| +|`druid.cache.locator`| Memcached locator. Can be consistent or `array_mod`.|consistent| +|`druid.cache.enableTls`|Enable TLS based connection for Memcached client. Boolean.|false| +|`druid.cache.clientMode`|Client Mode. Static mode requires the user to specify individual cluster nodes. Dynamic mode uses [AutoDiscovery](https://docs.aws.amazon.com/AmazonElastiCache/latest/mem-ug/AutoDiscovery.HowAutoDiscoveryWorks.html) feature of AWS Memcached. String. ["static"](https://docs.aws.amazon.com/AmazonElastiCache/latest/mem-ug/AutoDiscovery.Manual.html) or ["dynamic"](https://docs.aws.amazon.com/AmazonElastiCache/latest/mem-ug/AutoDiscovery.Using.ModifyApp.Java.html)|static| +|`druid.cache.skipTlsHostnameVerification`|Skip TLS Hostname Verification. Boolean.|true| + +#### Hybrid + +Uses a combination of any two caches as a two-level L1 / L2 cache. +This may be used to combine a local in-memory cache with a remote memcached cache. + +Cache requests will first check L1 cache before checking L2. +If there is an L1 miss and L2 hit, it will also populate L1. + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.cache.l1.type`|The type of cache to use for L1 cache. See `druid.cache.type` configuration for valid types.|`caffeine`| +|`druid.cache.l2.type`|The type of cache to use for L2 cache. See `druid.cache.type` configuration for valid types.|`caffeine`| +|`druid.cache.l1.*`|Any property valid for the given type of L1 cache can be set using this prefix. For instance, if you are using a `caffeine` L1 cache, specify `druid.cache.l1.sizeInBytes` to set its size.|defaults are the same as for the given cache type| +|`druid.cache.l2.*`|Prefix for L2 cache settings, see description for L1.|defaults are the same as for the given cache type| +|`druid.cache.useL2`|A boolean indicating whether to query L2 cache, if it's a miss in L1. It makes sense to configure this to `false` on Historical processes, if L2 is a remote cache like `memcached`, and this cache also used on brokers, because in this case if a query reached Historical it means that a broker didn't find corresponding results in the same remote cache, so a query to the remote cache from Historical is guaranteed to be a miss.|`true`| +|`druid.cache.populateL2`|A boolean indicating whether to put results into L2 cache.|`true`| + +## General query configuration + +This section describes configurations that control behavior of Druid's query types, applicable to Broker, Historical, and Middle Manager processes. 
+
+### Overriding default query context values
+
+You can override any [query context general parameter](../querying/query-context-reference.md#general-parameters) default value by setting the runtime property in the format of `druid.query.default.context.{query_context_key}`.
+The `druid.query.default.context.{query_context_key}` runtime property prefix applies to all current and future query context keys, the same as how a query context parameter passed with the query works. A value for the same key specified in the query context overrides the runtime property value.
+
+The precedence chain for query context values is as follows:
+
+hard-coded default value in Druid code `<-` runtime property not prefixed with `druid.query.default.context`
+`<-` runtime property prefixed with `druid.query.default.context` `<-` context parameter in the query
+
+Note that not every query context key has a runtime property not prefixed with `druid.query.default.context` that can
+override the hard-coded default value. For example, `maxQueuedBytes` has `druid.broker.http.maxQueuedBytes`,
+but `joinFilterRewriteMaxSize` does not. Hence, the only way to override the hard-coded default
+value of `joinFilterRewriteMaxSize` is with the runtime property `druid.query.default.context.joinFilterRewriteMaxSize`.
+
+To further elaborate on the previous example:
+
+If neither `druid.broker.http.maxQueuedBytes` nor `druid.query.default.context.maxQueuedBytes` is set and
+the query does not have `maxQueuedBytes` in the context, then the hard-coded value in Druid code is used.
+If the runtime properties only contain `druid.broker.http.maxQueuedBytes=x` and the query does not have `maxQueuedBytes` in the
+context, then the value of the property, `x`, is used. However, if the query does have `maxQueuedBytes` in the context,
+then that value is used instead.
+If the runtime properties only contain `druid.query.default.context.maxQueuedBytes=y`, or contain both
+`druid.broker.http.maxQueuedBytes=x` and `druid.query.default.context.maxQueuedBytes=y`, then the value of
+`druid.query.default.context.maxQueuedBytes`, `y`, is used (given that the query does not have `maxQueuedBytes` in the
+context). If the query does have `maxQueuedBytes` in the context, then that value is used instead.
+
+### TopN query config
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.query.topN.minTopNThreshold`|See [TopN Aliasing](../querying/topnquery.md#aliasing) for details.|1000|
+
+### Search query config
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.query.search.maxSearchLimit`|Maximum number of search results to return.|1000|
+|`druid.query.search.searchStrategy`|Default search query strategy.|`useIndexes`|
+
+### SegmentMetadata query config
+
+|Property|Description|Default|
+|--------|-----------|-------|
+|`druid.query.segmentMetadata.defaultHistory`|When no interval is specified in the query, use a default interval of defaultHistory before the end time of the most recent segment, specified in ISO8601 format. 
This property also controls the duration of the default interval used by `GET` `/druid/v2/datasources/{dataSourceName}` interactions for retrieving datasource dimensions and metrics.|`P1W`| +|`druid.query.segmentMetadata.defaultAnalysisTypes`|This can be used to set the Default Analysis Types for all segment metadata queries, this can be overridden when making the query|`["cardinality", "interval", "minmax"]`| + +### GroupBy query config + +This section describes the configurations for groupBy queries. You can set the runtime properties in the `runtime.properties` file on Broker, Historical, and Middle Manager processes. You can set the query context parameters through the [query context](../querying/query-context-reference.md). + +Supported runtime properties: + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.query.groupBy.maxSelectorDictionarySize`|Maximum amount of heap space (approximately) to use for per-segment string dictionaries. See [groupBy memory tuning and resource limits](../querying/groupbyquery.md#memory-tuning-and-resource-limits) for details.|100000000| +|`druid.query.groupBy.maxMergingDictionarySize`|Maximum amount of heap space (approximately) to use for per-query string dictionaries. When the dictionary exceeds this size, a spill to disk will be triggered. See [groupBy memory tuning and resource limits](../querying/groupbyquery.md#memory-tuning-and-resource-limits) for details.|100000000| +|`druid.query.groupBy.maxOnDiskStorage`|Maximum amount of disk space to use, per-query, for spilling result sets to disk when either the merging buffer or the dictionary fills up. Queries that exceed this limit will fail. Set to zero to disable disk spilling.|0 (disabled)| +|`druid.query.groupBy.defaultOnDiskStorage`|Default amount of disk space to use, per-query, for spilling the result sets to disk when either the merging buffer or the dictionary fills up. Set to zero to disable disk spilling for queries which don't override `maxOnDiskStorage` in their context.|`druid.query.groupBy.maxOnDiskStorage`| + +Supported query contexts: + +|Key|Description| +|---|-----------| +|`maxSelectorDictionarySize`|Can be used to lower the value of `druid.query.groupBy.maxMergingDictionarySize` for this query.| +|`maxMergingDictionarySize`|Can be used to lower the value of `druid.query.groupBy.maxMergingDictionarySize` for this query.| +|`maxOnDiskStorage`|Can be used to set `maxOnDiskStorage` to a value between 0 and `druid.query.groupBy.maxOnDiskStorage` for this query. If this query context override exceeds `druid.query.groupBy.maxOnDiskStorage`, the query will use `druid.query.groupBy.maxOnDiskStorage`. Omitting this from the query context will cause the query to use `druid.query.groupBy.defaultOnDiskStorage` for `maxOnDiskStorage`| + +### Advanced configurations + +Supported runtime properties: + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.query.groupBy.singleThreaded`|Merge results using a single thread.|false| +|`druid.query.groupBy.bufferGrouperInitialBuckets`|Initial number of buckets in the off-heap hash table used for grouping results. Set to 0 to use a reasonable default (1024).|0| +|`druid.query.groupBy.bufferGrouperMaxLoadFactor`|Maximum load factor of the off-heap hash table used for grouping results. When the load factor exceeds this size, the table will be grown or spilled to disk. 
Set to 0 to use a reasonable default (0.7).|0| +|`druid.query.groupBy.forceHashAggregation`|Force to use hash-based aggregation.|false| +|`druid.query.groupBy.intermediateCombineDegree`|Number of intermediate processes combined together in the combining tree. Higher degrees will need less threads which might be helpful to improve the query performance by reducing the overhead of too many threads if the server has sufficiently powerful CPU cores.|8| +|`druid.query.groupBy.numParallelCombineThreads`|Hint for the number of parallel combining threads. This should be larger than 1 to turn on the parallel combining feature. The actual number of threads used for parallel combining is min(`druid.query.groupBy.numParallelCombineThreads`, `druid.processing.numThreads`).|1 (disabled)| + +Supported query contexts: + +|Key|Description|Default| +|---|-----------|-------| +|`groupByIsSingleThreaded`|Overrides the value of `druid.query.groupBy.singleThreaded` for this query.| | +|`bufferGrouperInitialBuckets`|Overrides the value of `druid.query.groupBy.bufferGrouperInitialBuckets` for this query.|none| +|`bufferGrouperMaxLoadFactor`|Overrides the value of `druid.query.groupBy.bufferGrouperMaxLoadFactor` for this query.|none| +|`forceHashAggregation`|Overrides the value of `druid.query.groupBy.forceHashAggregation`|none| +|`intermediateCombineDegree`|Overrides the value of `druid.query.groupBy.intermediateCombineDegree`|none| +|`numParallelCombineThreads`|Overrides the value of `druid.query.groupBy.numParallelCombineThreads`|none| +|`sortByDimsFirst`|Sort the results first by dimension values and then by timestamp.|false| +|`forceLimitPushDown`|When all fields in the orderby are part of the grouping key, the broker will push limit application down to the Historical processes. When the sorting order uses fields that are not in the grouping key, applying this optimization can result in approximate results with unknown accuracy, so this optimization is disabled by default in that case. Enabling this context flag turns on limit push down for limit/orderbys that contain non-grouping key columns.|false| + +### Router + +#### Router process configs + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.host`|The host for the current process. This is used to advertise the current processes location as reachable from another process and should generally be specified such that `http://${druid.host}/` could actually talk to this process|`InetAddress.getLocalHost().getCanonicalHostName()`| +|`druid.bindOnHost`|Indicating whether the process's internal jetty server bind on `druid.host`. Default is false, which means binding to all interfaces.|false| +|`druid.plaintextPort`|This is the port to actually listen on; unless port mapping is used, this will be the same port as is on `druid.host`|8888| +|`druid.tlsPort`|TLS port for HTTPS connector, if [druid.enableTlsPort](../operations/tls-support.md) is set then this config will be used. If `druid.host` contains port then that port will be ignored. This should be a non-negative Integer.|9088| +|`druid.service`|The name of the service. This is used as a dimension when emitting metrics and alerts to differentiate between the various services|`druid/router`| +|`druid.labels`|Optional JSON object of key-value pairs that define custom labels for the server. These labels are displayed in the web console under the "Services" tab. 
Example: `druid.labels={"location":"Airtrunk"}` or `druid.labels.location=Airtrunk`|`null`| + +#### Runtime configuration + +|Property|Description|Default| +|--------|-----------|-------| +|`druid.router.defaultBrokerServiceName`|The default Broker to connect to in case service discovery fails.|`druid/broker`| +|`druid.router.tierToBrokerMap`|Queries for a certain tier of data are routed to their appropriate Broker. This value should be an ordered JSON map of tiers to Broker names. The priority of Brokers is based on the ordering.|`{"_default_tier": ""}`| +|`druid.router.defaultRule`|The default rule for all datasources.|`_default`| +|`druid.router.pollPeriod`|How often to poll for new rules.|`PT1M`| +|`druid.router.sql.enable`|Enable routing of SQL queries using strategies. When`true`, the Router uses the strategies defined in `druid.router.strategies` to determine the broker service for a given SQL query. When `false`, the Router uses the `defaultBrokerServiceName`.|`false`| +|`druid.router.strategies`|Please see [Router Strategies](../design/router.md#router-strategies) for details.|`[{"type":"timeBoundary"},{"type":"priority"}]`| +|`druid.router.avatica.balancer.type`|Class to use for balancing Avatica queries across Brokers. Please see [Avatica Query Balancing](../design/router.md#avatica-query-balancing).|`rendezvousHash`| +|`druid.router.managementProxy.enabled`|Enables the Router's [management proxy](../design/router.md#router-as-management-proxy) functionality.|false| +|`druid.router.http.numConnections`|Size of connection pool for the Router to connect to Broker processes. If there are more queries than this number that all need to speak to the same process, then they will queue up.|`20`| +|`druid.router.http.eagerInitialization`|Indicates that http connections from Router to Broker should be eagerly initialized. If set to true, `numConnections` connections are created upon initialization|`true`| +|`druid.router.http.readTimeout`|The timeout for data reads from Broker processes.|`PT15M`| +|`druid.router.http.numMaxThreads`|Maximum number of worker threads to handle HTTP requests and responses|`(number of cores) * 3 / 2 + 1`| +|`druid.router.http.numRequestsQueued`|Maximum number of requests that may be queued to a destination|`1024`| +|`druid.router.http.requestBuffersize`|Size of the content buffer for receiving requests. These buffers are only used for active connections that have requests with bodies that will not fit within the header buffer|`8 * 1024`| +|`druid.router.http.clientConnectTimeout`|The timeout (in milliseconds) for establishing client connections.|500| diff --git a/docs/35.0.0/configuration/logging.md b/docs/35.0.0/configuration/logging.md new file mode 100644 index 0000000000..d740f38b09 --- /dev/null +++ b/docs/35.0.0/configuration/logging.md @@ -0,0 +1,170 @@ +--- +id: logging +title: "Logging" +--- + + + + +Apache Druid services emit logs that to help you debug. +The same services also emit periodic [metrics](../configuration/index.md#metrics-monitors) about their state. +To disable metric info logs set the following runtime property: `-Ddruid.emitter.logging.logLevel=debug`. + +Druid uses [log4j2](http://logging.apache.org/log4j/2.x/) for logging. +The default configuration file log4j2.xml ships with Druid at the following path: `conf/druid/{config}/_common/log4j2.xml`. + +By default, Druid uses `RollingRandomAccessFile` for rollover daily, and keeps log files up to 7 days. +If that's not suitable in your case, modify the `log4j2.xml` accordingly. 
+ +The following example log4j2.xml is based upon the micro quickstart: + +``` + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +``` + +Peons always output logs to standard output. Middle Managers redirect task logs from standard output to +[long-term storage](index.md#log-long-term-storage). + +:::info + + Druid shares the log4j configuration file among all services, including task peon processes. + However, you must define a console appender in the logger for your peon processes. + If you don't define a console appender, Druid creates and configures a new console appender + that retains the log level, such as `info` or `warn`, but does not retain any other appender + configuration, including non-console ones. +::: + +## Log directory +The included log4j2.xml configuration for Druid and ZooKeeper writes logs to the `log` directory at the root of the distribution. + +If you want to change the log directory, set the environment variable `DRUID_LOG_DIR` to the right directory before you start Druid. + +## All-in-one start commands + +If you use one of the all-in-one start commands, such as `bin/start-micro-quickstart`, the default configuration for each service has two kinds of log files. +Log4j2 writes the main log file and rotates it periodically. +For example, `log/historical.log`. + +The secondary log file contains anything that is written by the component +directly to standard output or standard error without going through log4j2. +For example, `log/historical.stdout.log`. +This consists mainly of messages from the +Java runtime itself. +This file is not rotated, but it is generally small due to the low volume of messages. +If necessary, you can truncate it using the Linux command `truncate --size 0 log/historical.stdout.log`. + +## Set the logs to asynchronously write + +If your logs are really chatty, you can set them to write asynchronously. +The following example shows a `log4j2.xml` that configures some of the more chatty classes to write asynchronously: + +``` + + + + + + + + + + + + + + + + + + + + + + + + + + + + +``` diff --git a/docs/35.0.0/data-management/automatic-compaction.md b/docs/35.0.0/data-management/automatic-compaction.md new file mode 100644 index 0000000000..1a0803bafb --- /dev/null +++ b/docs/35.0.0/data-management/automatic-compaction.md @@ -0,0 +1,370 @@ +--- +id: automatic-compaction +title: "Automatic compaction" +--- + + + +In Apache Druid, compaction is a special type of ingestion task that reads data from a Druid datasource and writes it back into the same datasource. A common use case for this is to [optimally size segments](../operations/segment-optimization.md) after ingestion to improve query performance. Automatic compaction, or auto-compaction, refers to the system for automatic execution of compaction tasks issued by Druid itself. In addition to auto-compaction, you can perform [manual compaction](./manual-compaction.md) using the Overlord APIs. + +:::info + Auto-compaction skips datasources that have a segment granularity of `ALL`. +::: + +As a best practice, you should set up auto-compaction for all Druid datasources. You can run compaction tasks manually for cases where you want to allocate more system resources. For example, you may choose to run multiple compaction tasks in parallel to compact an existing datasource for the first time. See [Compaction](compaction.md) for additional details and use cases. 
+
+This topic guides you through setting up automatic compaction for your Druid cluster. See the [examples](#examples) for common use cases for automatic compaction.
+
+## Auto-compaction syntax
+
+You can configure automatic compaction dynamically without restarting Druid.
+The automatic compaction system uses the following syntax:
+
+```json
+{
+  "dataSource": <task_datasource>,
+  "ioConfig": <IO config>,
+  "dimensionsSpec": <custom dimensionsSpec>,
+  "transformSpec": <custom transformSpec>,
+  "metricsSpec": <custom metricsSpec>,
+  "tuningConfig": <parallel indexing task tuningConfig>,
+  "granularitySpec": <compaction task granularitySpec>,
+  "skipOffsetFromLatest":