diff --git a/.github/workflows/jekyll-spec-insert.yml b/.github/workflows/jekyll-spec-insert.yml new file mode 100644 index 0000000000..cefd477be2 --- /dev/null +++ b/.github/workflows/jekyll-spec-insert.yml @@ -0,0 +1,20 @@ +name: Lint and Test Jekyll Spec Insert +on: + push: + paths: + - 'spec-insert/**' + pull_request: + paths: + - 'spec-insert/**' +jobs: + lint-and-test: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v4 + - uses: ruby/setup-ruby@v1 + with: { ruby-version: 3.3.0 } + - run: bundle install + - working-directory: spec-insert + run: | + bundle exec rubocop + bundle exec rspec diff --git a/.github/workflows/update-api-components.yml b/.github/workflows/update-api-components.yml new file mode 100644 index 0000000000..42cc1d2827 --- /dev/null +++ b/.github/workflows/update-api-components.yml @@ -0,0 +1,52 @@ +name: Update API Components +on: + workflow_dispatch: + schedule: + - cron: "0 0 * * 0" # Every Sunday at midnight GMT +jobs: + update-api-components: + if: ${{ github.repository == 'opensearch-project/documentation-website' }} + runs-on: ubuntu-latest + permissions: + contents: write + pull-requests: write + steps: + - uses: actions/checkout@v4 + with: + submodules: recursive + fetch-depth: 0 + + - run: git config --global pull.rebase true + + - uses: ruby/setup-ruby@v1 + with: { ruby-version: 3.3.0 } + + - run: bundle install + + - name: Download spec and insert into documentation + run: bundle exec jekyll spec-insert + + - name: Get current date + id: date + run: echo "date=$(date +'%Y-%m-%d')" >> $GITHUB_ENV + + - name: GitHub App token + id: github_app_token + uses: tibdex/github-app-token@v2.1.0 + with: + app_id: ${{ secrets.APP_ID }} + private_key: ${{ secrets.APP_PRIVATE_KEY }} + + - name: Create pull request + uses: peter-evans/create-pull-request@v6 + with: + token: ${{ steps.github_app_token.outputs.token }} + commit-message: "Updated API components to reflect the latest OpenSearch API spec (${{ env.date }})" + title: "[AUTOCUT] Update API components to reflect the latest OpenSearch API spec (${{ env.date }})" + body: | + Update API components to reflect the latest [OpenSearch API spec](https://github.com/opensearch-project/opensearch-api-specification/releases/download/main-latest/opensearch-openapi.yaml). + Date: ${{ env.date }} + branch: update-api-components-${{ env.date }} + base: main + signoff: true + labels: autocut \ No newline at end of file diff --git a/.ruby-version b/.ruby-version deleted file mode 100644 index 4772543317..0000000000 --- a/.ruby-version +++ /dev/null @@ -1 +0,0 @@ -3.3.2 diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index a3628b3b6e..f6d9b87ee8 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -84,7 +84,7 @@ Follow these steps to set up your local copy of the repository: ``` curl -sSL https://get.rvm.io | bash -s stable - rvm install 3.2.4 + rvm install 3.3.2 ruby -v ``` @@ -158,6 +158,23 @@ To ensure that our documentation adheres to the [OpenSearch Project Style Guidel Optionally, you can install the [Vale VSCode](https://github.com/chrischinchilla/vale-vscode) extension, which integrates Vale with Visual Studio Code. By default, only _errors_ and _warnings_ are underlined. To change the minimum alert level to include _suggestions_, go to **Vale VSCode** > **Extension Settings** and select **suggestion** in the **Vale > Vale CLI: Min Alert Level** dropdown list. +## Troubleshooting + +This section provides information about potential solutions for known issues. 
+
+### Installing Ruby on an Apple silicon machine
+
+If you're having trouble installing Ruby with `rvm` on an Apple silicon machine, it could be because of an OpenSSL version mismatch. To fix this issue, use the following commands, replacing `<version>` with your [desired version](https://github.com/ruby/openssl/blob/master/README.md):
+
+```
+# Assumes Homebrew is installed
+curl -sSL https://get.rvm.io | bash -s stable
+rvm install 3.3.2 --with-openssl-dir=$(brew --prefix openssl@<version>)
+ruby -v
+```
+
 ## Getting help
 
 For help with the contribution process, reach out to one of the [points of contact](README.md#points-of-contact).
+
+
diff --git a/DEVELOPER_GUIDE.md b/DEVELOPER_GUIDE.md
new file mode 100644
index 0000000000..9b0ec1c79d
--- /dev/null
+++ b/DEVELOPER_GUIDE.md
@@ -0,0 +1,135 @@
+# Developer guide
+- [Introduction](#introduction)
+- [Starting the Jekyll server locally](#starting-the-jekyll-server-locally)
+- [Using the spec-insert Jekyll plugin](#using-the-spec-insert-jekyll-plugin)
+  - [Ignoring files and folders](#ignoring-files-and-folders)
+- [CI/CD](#cicd)
+- [Spec insert components](#spec-insert-components)
+  - [Query parameters](#query-parameters)
+  - [Path parameters](#path-parameters)
+  - [Paths and HTTP methods](#paths-and-http-methods)
+
+## Introduction
+
+The `.md` documents in this repository are rendered into HTML pages using [Jekyll](https://jekyllrb.com/). These HTML pages are hosted on [opensearch.org](https://opensearch.org/docs/latest/).
+
+## Starting the Jekyll server locally
+
+You can run the Jekyll server locally to view the rendered HTML pages using the following steps:
+
+1. Install [Ruby](https://www.ruby-lang.org/en/documentation/installation/) 3.1.0 or later for your operating system.
+2. Install the required gems by running `bundle install`.
+3. Run `bundle exec jekyll serve` to start the Jekyll server locally (this can take several minutes to complete).
+4. Open your browser and navigate to `http://localhost:4000` to view the rendered HTML pages.
+
+## Using the `spec-insert` Jekyll plugin
+
+The `spec-insert` Jekyll plugin is used to insert API components into Markdown files. The plugin downloads the [latest OpenSearch specification](https://github.com/opensearch-project/opensearch-api-specification) and renders the API components from the spec. This aims to reduce the manual effort required to keep the documentation up to date.
+
+To use this plugin, make sure that you have installed Ruby 3.1.0 or later and the required gems by running `bundle install`.
+
+Edit your Markdown file and insert the following snippet where you want to render an API component:
+
+```markdown
+<!-- spec_insert_start
+api: search
+component: query_parameters
+-->
+
+This is where the API component will be inserted.
+Everything between the `spec_insert_start` and `spec_insert_end` tags will be overwritten.
+
+<!-- spec_insert_end -->
+```
+
+Then run the following Jekyll command to render the API components:
+
+```shell
+bundle exec jekyll spec-insert
+```
+
+If you are working on multiple Markdown files and do not want to keep rerunning the `jekyll spec-insert` command, you can add the `--watch` (or `-W`) flag to the command to watch for changes in the Markdown files and automatically render the API components:
+
+```shell
+bundle exec jekyll spec-insert --watch
+```
+
+Depending on the text editor you are using, you may need to manually reload the file from disk to see the changes applied by the plugin if the editor does not reload files automatically.
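+For reference, after the plugin runs, everything between the tags is replaced with the rendered component. The following is a sketch of what the filled-in snippet from the previous example might look like (illustrative only; the actual rows and formatting are generated from the downloaded spec and will differ):
+
+```markdown
+<!-- spec_insert_start
+api: search
+component: query_parameters
+-->
+## Query parameters
+
+Parameter | Type | Description
+:--- | :--- | :---
+`analyzer` | String | The analyzer to use for the query string.
+`size` | Integer | The number of results to return.
+<!-- spec_insert_end -->
+```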
+The plugin will pull the newest OpenSearch API spec from its [repository](https://github.com/opensearch-project/opensearch-api-specification) if the spec file does not exist locally or if it is older than 24 hours. To tell the plugin to always pull the newest spec, add the `--refresh-spec` (or `-R`) flag to the command:
+
+```shell
+bundle exec jekyll spec-insert --refresh-spec
+```
+
+### Ignoring files and folders
+
+The `spec-insert` plugin ignores all files and folders listed in the [./_config.yml#exclude](./_config.yml) list, which is also the list of files and folders that Jekyll ignores.
+
+## CI/CD
+
+The `spec-insert` plugin is run as part of the CI/CD pipeline to ensure that the API components in the documentation are up to date. This is performed through the [update-api-components.yml](.github/workflows/update-api-components.yml) GitHub Actions workflow, which creates a pull request containing the updated API components every Sunday.
+
+## Spec insert components
+
+All spec insert components accept the following arguments:
+- `api` (String; required): The name of the API to render the component from. This is equivalent to the `x-operation-group` field in the OpenSearch OpenAPI spec.
+- `component` (String; required): The name of the component to render, such as `query_parameters`, `path_parameters`, or `paths_and_http_methods`.
+- `omit_header` (Boolean; default is `false`): If set to `true`, the Markdown header of the component is not rendered.
+
+### Paths and HTTP methods
+
+To insert the paths and HTTP methods for the `search` API, use the following snippet:
+
+```markdown
+<!-- spec_insert_start
+api: search
+component: paths_and_http_methods
+-->
+<!-- spec_insert_end -->
+```
+
+### Path parameters
+
+To insert the path parameters table for the `indices.create` API, use the following snippet. Use the `x-operation-group` field from the OpenSearch OpenAPI spec for the `api` value:
+
+```markdown
+<!-- spec_insert_start
+api: indices.create
+component: path_parameters
+-->
+<!-- spec_insert_end -->
+```
+
+This component accepts the same arguments as the query parameters component, except for the `include_global` argument.
+
+### Query parameters
+
+To insert the query parameters table for the `cat.indices` API, use the following snippet:
+
+```markdown
+<!-- spec_insert_start
+api: cat.indices
+component: query_parameters
+-->
+<!-- spec_insert_end -->
+```
+
+This inserts the query parameters of the `cat.indices` API into the `.md` file with three default columns: `Parameter`, `Type`, and `Description`. You can customize the query parameters table by adding the `columns` argument, which accepts a comma-separated list of column names. The available column names are:
+
+- `Parameter`
+- `Type`
+- `Description`
+- `Required`
+- `Default`
+
+_When `Required` or `Default` is not selected, that information is included in the `Description` column._
+
+You can also customize this component with the following settings:
+
+- `include_global` (Boolean; default is `false`): Includes global query parameters in the table.
+- `include_deprecated` (Boolean; default is `true`): Includes deprecated parameters in the table.
+- `pretty` (Boolean; default is `false`): Renders the table in the pretty format instead of the compact format.
+
+The following snippet inserts the specified columns into the query parameters table:
+
+```markdown
+<!-- spec_insert_start
+api: cat.indices
+component: query_parameters
+columns: Parameter, Type, Description, Required, Default
+-->
+<!-- spec_insert_end -->
+```
diff --git a/Gemfile b/Gemfile
index 7825dcd02b..fee04f3c48 100644
--- a/Gemfile
+++ b/Gemfile
@@ -1,4 +1,9 @@
-source "http://rubygems.org"
+# frozen_string_literal: true
+
+source 'https://rubygems.org'
+
+# Manually add csv gem since Ruby 3.4.0 no longer includes it
+gem 'csv', '~> 3.0'
 
 # Hello! This is where you manage which Jekyll version is used to run.
# When you want to use a different version, change it below, save the @@ -8,12 +13,12 @@ source "http://rubygems.org" # # This will help ensure the proper Jekyll version is running. # Happy Jekylling! -gem "jekyll", "~> 4.3.2" +gem 'jekyll', '~> 4.3.2' # This is the default theme for new Jekyll sites. You may change this to anything you like. -gem "just-the-docs", "~> 0.3.3" -gem "jekyll-remote-theme", "~> 0.4" -gem "jekyll-redirect-from", "~> 0.16" +gem 'jekyll-redirect-from', '~> 0.16' +gem 'jekyll-remote-theme', '~> 0.4' +gem 'just-the-docs', '~> 0.3.3' # If you want to use GitHub Pages, remove the "gem "jekyll"" above and # uncomment the line below. To upgrade, run `bundle update github-pages`. @@ -22,21 +27,31 @@ gem "jekyll-redirect-from", "~> 0.16" # If you have any plugins, put them here! group :jekyll_plugins do - gem "jekyll-last-modified-at" - gem "jekyll-sitemap" + gem 'jekyll-last-modified-at' + gem 'jekyll-sitemap' + gem 'jekyll-spec-insert', :path => './spec-insert' end # Windows does not include zoneinfo files, so bundle the tzinfo-data gem -gem "tzinfo-data", platforms: [:mingw, :mswin, :x64_mingw, :jruby] +gem 'tzinfo-data', platforms: %i[mingw mswin x64_mingw jruby] # Performance-booster for watching directories on Windows -gem "wdm", "~> 0.1.0" if Gem.win_platform? +gem 'wdm', '~> 0.1.0' if Gem.win_platform? # Installs webrick dependency for building locally -gem "webrick", "~> 1.7" - +gem 'webrick', '~> 1.7' # Link checker -gem "typhoeus" -gem "ruby-link-checker" -gem "ruby-enum" +gem 'ruby-enum' +gem 'ruby-link-checker' +gem 'typhoeus' + +# Spec Insert +gem 'activesupport', '~> 7' +gem 'mustache', '~> 1' + +group :development, :test do + gem 'rspec' + gem 'rubocop', '~> 1.44', require: false + gem 'rubocop-rake', require: false +end diff --git a/README.md b/README.md index 66beb1948c..52321335c7 100644 --- a/README.md +++ b/README.md @@ -3,6 +3,7 @@ # About the OpenSearch documentation repo The `documentation-website` repository contains the user documentation for OpenSearch. You can find the rendered documentation at [opensearch.org/docs](https://opensearch.org/docs). +The markdown files in this repository are rendered into HTML pages using [Jekyll](https://jekyllrb.com/). Check the [DEVELOPER_GUIDE](DEVELOPER_GUIDE.md) for more information about how to use Jekyll for this repository. ## Contributing diff --git a/_aggregations/bucket/nested.md b/_aggregations/bucket/nested.md index 89c44c6457..affda8e437 100644 --- a/_aggregations/bucket/nested.md +++ b/_aggregations/bucket/nested.md @@ -96,8 +96,8 @@ GET logs/_search "aggregations" : { "pages" : { "doc_count" : 2, - "min_price" : { - "value" : 200.0 + "min_load_time" : { + "value" : 200 } } } diff --git a/_analyzers/character-filters/html-character-filter.md b/_analyzers/character-filters/html-character-filter.md index 9fb98d9744..ef55930bdf 100644 --- a/_analyzers/character-filters/html-character-filter.md +++ b/_analyzers/character-filters/html-character-filter.md @@ -1,11 +1,11 @@ --- layout: default -title: html_strip character filter +title: HTML strip parent: Character filters nav_order: 100 --- -# `html_strip` character filter +# HTML strip character filter The `html_strip` character filter removes HTML tags, such as `
<div>`, `<p>
`, and ``, from the input text and renders plain text. The filter can be configured to preserve certain tags or decode specific HTML entities, such as ` `, into spaces. diff --git a/_analyzers/language-analyzers.md b/_analyzers/language-analyzers.md deleted file mode 100644 index ca4ba320dd..0000000000 --- a/_analyzers/language-analyzers.md +++ /dev/null @@ -1,44 +0,0 @@ ---- -layout: default -title: Language analyzers -nav_order: 100 -parent: Analyzers -redirect_from: - - /query-dsl/analyzers/language-analyzers/ ---- - -# Language analyzers - -OpenSearch supports the following language analyzers: -`arabic`, `armenian`, `basque`, `bengali`, `brazilian`, `bulgarian`, `catalan`, `czech`, `danish`, `dutch`, `english`, `estonian`, `finnish`, `french`, `galician`, `german`, `greek`, `hindi`, `hungarian`, `indonesian`, `irish`, `italian`, `latvian`, `lithuanian`, `norwegian`, `persian`, `portuguese`, `romanian`, `russian`, `sorani`, `spanish`, `swedish`, `turkish`, and `thai`. - -To use the analyzer when you map an index, specify the value within your query. For example, to map your index with the French language analyzer, specify the `french` value for the analyzer field: - -```json - "analyzer": "french" -``` - -#### Example request - -The following query specifies the `french` language analyzer for the index `my-index`: - -```json -PUT my-index -{ - "mappings": { - "properties": { - "text": { - "type": "text", - "fields": { - "french": { - "type": "text", - "analyzer": "french" - } - } - } - } - } -} -``` - - diff --git a/_analyzers/language-analyzers/arabic.md b/_analyzers/language-analyzers/arabic.md new file mode 100644 index 0000000000..e61c684cbb --- /dev/null +++ b/_analyzers/language-analyzers/arabic.md @@ -0,0 +1,182 @@ +--- +layout: default +title: Arabic +parent: Language analyzers +grand_parent: Analyzers +nav_order: 10 +--- + +# Arabic analyzer + +The built-in `arabic` analyzer can be applied to a text field using the following command: + +```json +PUT /arabic-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "arabic" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_arabic +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_arabic_analyzer":{ + "type":"arabic", + "stem_exclusion":["تكنولوجيا","سلطة "] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Arabic analyzer internals + +The `arabic` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - decimal_digit + - stop (Arabic) + - normalization (Arabic) + - keyword + - stemmer (Arabic) + +## Custom Arabic analyzer + +You can create a custom Arabic analyzer using the following command: + +```json +PUT /arabic-index +{ + "settings": { + "analysis": { + "filter": { + "arabic_stop": { + "type": "stop", + "stopwords": "_arabic_" + }, + "arabic_stemmer": { + "type": "stemmer", + "language": "arabic" + }, + "arabic_normalization": { + "type": "arabic_normalization" + }, + "decimal_digit": { + "type": "decimal_digit" + }, + "arabic_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "arabic_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "arabic_normalization", + "decimal_digit", + "arabic_stop", + "arabic_keywords", + "arabic_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { 
+ "content": { + "type": "text", + "analyzer": "arabic_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /arabic-index/_analyze +{ + "field": "content", + "text": "الطلاب يدرسون في الجامعات العربية. أرقامهم ١٢٣٤٥٦." +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "طلاب", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "يدرس", + "start_offset": 7, + "end_offset": 13, + "type": "", + "position": 1 + }, + { + "token": "جامع", + "start_offset": 17, + "end_offset": 25, + "type": "", + "position": 3 + }, + { + "token": "عرب", + "start_offset": 26, + "end_offset": 33, + "type": "", + "position": 4 + }, + { + "token": "ارقامهم", + "start_offset": 35, + "end_offset": 42, + "type": "", + "position": 5 + }, + { + "token": "123456", + "start_offset": 43, + "end_offset": 49, + "type": "", + "position": 6 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/armenian.md b/_analyzers/language-analyzers/armenian.md new file mode 100644 index 0000000000..9bd0549c80 --- /dev/null +++ b/_analyzers/language-analyzers/armenian.md @@ -0,0 +1,137 @@ +--- +layout: default +title: Armenian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 20 +--- + +# Armenian analyzer + +The built-in `armenian` analyzer can be applied to a text field using the following command: + +```json +PUT /arabic-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "armenian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_armenian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_armenian_analyzer": { + "type": "armenian", + "stem_exclusion": ["բարև", "խաղաղություն"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Armenian analyzer internals + +The `armenian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Armenian) + - keyword + - stemmer (Armenian) + +## Custom Armenian analyzer + +You can create a custom Armenian analyzer using the following command: + +```json +PUT /armenian-index +{ + "settings": { + "analysis": { + "filter": { + "armenian_stop": { + "type": "stop", + "stopwords": "_armenian_" + }, + "armenian_stemmer": { + "type": "stemmer", + "language": "armenian" + }, + "armenian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "armenian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "armenian_stop", + "armenian_keywords", + "armenian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "armenian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET armenian-index/_analyze +{ + "analyzer": "stem_exclusion_armenian_analyzer", + "text": "բարև բոլորին, մենք խաղաղություն ենք ուզում և նոր օր ենք սկսել" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "բարև","start_offset": 0,"end_offset": 4,"type": 
"","position": 0}, + {"token": "բոլոր","start_offset": 5,"end_offset": 12,"type": "","position": 1}, + {"token": "խաղաղություն","start_offset": 19,"end_offset": 31,"type": "","position": 3}, + {"token": "ուզ","start_offset": 36,"end_offset": 42,"type": "","position": 5}, + {"token": "նոր","start_offset": 45,"end_offset": 48,"type": "","position": 7}, + {"token": "օր","start_offset": 49,"end_offset": 51,"type": "","position": 8}, + {"token": "սկսել","start_offset": 56,"end_offset": 61,"type": "","position": 10} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/basque.md b/_analyzers/language-analyzers/basque.md new file mode 100644 index 0000000000..e73510cc66 --- /dev/null +++ b/_analyzers/language-analyzers/basque.md @@ -0,0 +1,137 @@ +--- +layout: default +title: Basque +parent: Language analyzers +grand_parent: Analyzers +nav_order: 30 +--- + +# Basque analyzer + +The built-in `basque` analyzer can be applied to a text field using the following command: + +```json +PUT /basque-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "basque" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_basque_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_basque_analyzer": { + "type": "basque", + "stem_exclusion": ["autoritate", "baldintza"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Basque analyzer internals + +The `basque` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Basque) + - keyword + - stemmer (Basque) + +## Custom Basque analyzer + +You can create a custom Basque analyzer using the following command: + +```json +PUT /basque-index +{ + "settings": { + "analysis": { + "filter": { + "basque_stop": { + "type": "stop", + "stopwords": "_basque_" + }, + "basque_stemmer": { + "type": "stemmer", + "language": "basque" + }, + "basque_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "basque_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "basque_stop", + "basque_keywords", + "basque_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "basque_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /basque-index/_analyze +{ + "field": "content", + "text": "Ikasleek euskal unibertsitateetan ikasten dute. Haien zenbakiak 123456 dira." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "ikasle","start_offset": 0,"end_offset": 8,"type": "","position": 0}, + {"token": "euskal","start_offset": 9,"end_offset": 15,"type": "","position": 1}, + {"token": "unibertsi","start_offset": 16,"end_offset": 33,"type": "","position": 2}, + {"token": "ikas","start_offset": 34,"end_offset": 41,"type": "","position": 3}, + {"token": "haien","start_offset": 48,"end_offset": 53,"type": "","position": 5}, + {"token": "zenba","start_offset": 54,"end_offset": 63,"type": "","position": 6}, + {"token": "123456","start_offset": 64,"end_offset": 70,"type": "","position": 7} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/bengali.md b/_analyzers/language-analyzers/bengali.md new file mode 100644 index 0000000000..af913a01ef --- /dev/null +++ b/_analyzers/language-analyzers/bengali.md @@ -0,0 +1,142 @@ +--- +layout: default +title: Bengali +parent: Language analyzers +grand_parent: Analyzers +nav_order: 40 +--- + +# Bengali analyzer + +The built-in `bengali` analyzer can be applied to a text field using the following command: + +```json +PUT /bengali-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "bengali" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_bengali_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_bengali_analyzer": { + "type": "bengali", + "stem_exclusion": ["কর্তৃপক্ষ", "অনুমোদন"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Bengali analyzer internals + +The `bengali` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - decimal_digit + - indic_normalization + - normalization (Bengali) + - stop (Bengali) + - keyword + - stemmer (Bengali) + +## Custom Bengali analyzer + +You can create a custom Bengali analyzer using the following command: + +```json +PUT /bengali-index +{ + "settings": { + "analysis": { + "filter": { + "bengali_stop": { + "type": "stop", + "stopwords": "_bengali_" + }, + "bengali_stemmer": { + "type": "stemmer", + "language": "bengali" + }, + "bengali_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "bengali_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "decimal_digit", + "indic_normalization", + "bengali_normalization", + "bengali_stop", + "bengali_keywords", + "bengali_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "bengali_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /bengali-index/_analyze +{ + "field": "content", + "text": "ছাত্ররা বিশ্ববিদ্যালয়ে পড়াশোনা করে। তাদের নম্বরগুলি ১২৩৪৫৬।" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "ছাত্র","start_offset": 0,"end_offset": 7,"type": "","position": 0}, + {"token": "বিসসবিদালয়","start_offset": 8,"end_offset": 23,"type": "","position": 1}, + {"token": "পরাসোন","start_offset": 24,"end_offset": 32,"type": "","position": 2}, + {"token": "তা","start_offset": 38,"end_offset": 43,"type": "","position": 4}, + {"token": 
"নমমর","start_offset": 44,"end_offset": 53,"type": "","position": 5}, + {"token": "123456","start_offset": 54,"end_offset": 60,"type": "","position": 6} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/brazilian.md b/_analyzers/language-analyzers/brazilian.md new file mode 100644 index 0000000000..67db2b92bc --- /dev/null +++ b/_analyzers/language-analyzers/brazilian.md @@ -0,0 +1,137 @@ +--- +layout: default +title: Brazilian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 50 +--- + +# Brazilian analyzer + +The built-in `brazilian` analyzer can be applied to a text field using the following command: + +```json +PUT /brazilian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "brazilian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_brazilian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_brazilian_analyzer": { + "type": "brazilian", + "stem_exclusion": ["autoridade", "aprovação"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Brazilian analyzer internals + +The `brazilian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Brazilian) + - keyword + - stemmer (Brazilian) + +## Custom Brazilian analyzer + +You can create a custom Brazilian analyzer using the following command: + +```json +PUT /brazilian-index +{ + "settings": { + "analysis": { + "filter": { + "brazilian_stop": { + "type": "stop", + "stopwords": "_brazilian_" + }, + "brazilian_stemmer": { + "type": "stemmer", + "language": "brazilian" + }, + "brazilian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "brazilian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "brazilian_stop", + "brazilian_keywords", + "brazilian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "brazilian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /brazilian-index/_analyze +{ + "field": "content", + "text": "Estudantes estudam em universidades brasileiras. Seus números são 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "estudant","start_offset": 0,"end_offset": 10,"type": "","position": 0}, + {"token": "estud","start_offset": 11,"end_offset": 18,"type": "","position": 1}, + {"token": "univers","start_offset": 22,"end_offset": 35,"type": "","position": 3}, + {"token": "brasileir","start_offset": 36,"end_offset": 47,"type": "","position": 4}, + {"token": "numer","start_offset": 54,"end_offset": 61,"type": "","position": 6}, + {"token": "sao","start_offset": 62,"end_offset": 65,"type": "","position": 7}, + {"token": "123456","start_offset": 66,"end_offset": 72,"type": "","position": 8} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/bulgarian.md b/_analyzers/language-analyzers/bulgarian.md new file mode 100644 index 0000000000..42d5794e18 --- /dev/null +++ b/_analyzers/language-analyzers/bulgarian.md @@ -0,0 +1,137 @@ +--- +layout: default +title: Bulgarian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 60 +--- + +# Bulgarian analyzer + +The built-in `bulgarian` analyzer can be applied to a text field using the following command: + +```json +PUT /bulgarian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "bulgarian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_bulgarian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_bulgarian_analyzer": { + "type": "bulgarian", + "stem_exclusion": ["авторитет", "одобрение"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Bulgarian analyzer internals + +The `bulgarian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Bulgarian) + - keyword + - stemmer (Bulgarian) + +## Custom Bulgarian analyzer + +You can create a custom Bulgarian analyzer using the following command: + +```json +PUT /bulgarian-index +{ + "settings": { + "analysis": { + "filter": { + "bulgarian_stop": { + "type": "stop", + "stopwords": "_bulgarian_" + }, + "bulgarian_stemmer": { + "type": "stemmer", + "language": "bulgarian" + }, + "bulgarian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "bulgarian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "bulgarian_stop", + "bulgarian_keywords", + "bulgarian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "bulgarian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /bulgarian-index/_analyze +{ + "field": "content", + "text": "Студентите учат в българските университети. Техните номера са 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "студент","start_offset": 0,"end_offset": 10,"type": "","position": 0}, + {"token": "учат","start_offset": 11,"end_offset": 15,"type": "","position": 1}, + {"token": "българск","start_offset": 18,"end_offset": 29,"type": "","position": 3}, + {"token": "университят","start_offset": 30,"end_offset": 42,"type": "","position": 4}, + {"token": "техн","start_offset": 44,"end_offset": 51,"type": "","position": 5}, + {"token": "номер","start_offset": 52,"end_offset": 58,"type": "","position": 6}, + {"token": "123456","start_offset": 62,"end_offset": 68,"type": "","position": 8} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/catalan.md b/_analyzers/language-analyzers/catalan.md new file mode 100644 index 0000000000..89762da094 --- /dev/null +++ b/_analyzers/language-analyzers/catalan.md @@ -0,0 +1,143 @@ +--- +layout: default +title: Catalan +parent: Language analyzers +grand_parent: Analyzers +nav_order: 70 +--- + +# Catalan analyzer + +The built-in `catalan` analyzer can be applied to a text field using the following command: + +```json +PUT /catalan-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "catalan" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_catalan_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_catalan_analyzer": { + "type": "catalan", + "stem_exclusion": ["autoritat", "aprovació"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Catalan analyzer internals + +The `catalan` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - elision (Catalan) + - lowercase + - stop (Catalan) + - keyword + - stemmer (Catalan) + +## Custom Catalan analyzer + +You can create a custom Catalan analyzer using the following command: + +```json +PUT /catalan-index +{ + "settings": { + "analysis": { + "filter": { + "catalan_stop": { + "type": "stop", + "stopwords": "_catalan_" + }, + "catalan_elision": { + "type": "elision", + "articles": [ "d", "l", "m", "n", "s", "t"], + "articles_case": true + }, + "catalan_stemmer": { + "type": "stemmer", + "language": "catalan" + }, + "catalan_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "catalan_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "catalan_elision", + "lowercase", + "catalan_stop", + "catalan_keywords", + "catalan_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "catalan_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /catalan-index/_analyze +{ + "field": "content", + "text": "Els estudiants estudien a les universitats catalanes. Els seus números són 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "estud","start_offset": 4,"end_offset": 14,"type": "","position": 1}, + {"token": "estud","start_offset": 15,"end_offset": 23,"type": "","position": 2}, + {"token": "univer","start_offset": 30,"end_offset": 42,"type": "","position": 5}, + {"token": "catalan","start_offset": 43,"end_offset": 52,"type": "","position": 6}, + {"token": "numer","start_offset": 63,"end_offset": 70,"type": "","position": 9}, + {"token": "123456","start_offset": 75,"end_offset": 81,"type": "","position": 11} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/cjk.md b/_analyzers/language-analyzers/cjk.md new file mode 100644 index 0000000000..aed7e6da22 --- /dev/null +++ b/_analyzers/language-analyzers/cjk.md @@ -0,0 +1,142 @@ +--- +layout: default +title: CJK +parent: Language analyzers +grand_parent: Analyzers +nav_order: 80 +--- + +# CJK analyzer + +The built-in `cjk` analyzer can be applied to a text field using the following command: + +```json +PUT /cjk-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "cjk" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_cjk_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_cjk_analyzer": { + "type": "cjk", + "stem_exclusion": ["example", "words"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## CJK analyzer internals + +The `cjk` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - cjk_width + - lowercase + - cjk_bigram + - stop (similar to English) + +## Custom CJK analyzer + +You can create a custom CJK analyzer using the following command: + +```json +PUT /cjk-index +{ + "settings": { + "analysis": { + "filter": { + "english_stop": { + "type": "stop", + "stopwords": [ + "a", "and", "are", "as", "at", "be", "but", "by", "for", + "if", "in", "into", "is", "it", "no", "not", "of", "on", + "or", "s", "such", "t", "that", "the", "their", "then", + "there", "these", "they", "this", "to", "was", "will", + "with", "www" + ] + } + }, + "analyzer": { + "cjk_custom_analyzer": { + "tokenizer": "standard", + "filter": [ + "cjk_width", + "lowercase", + "cjk_bigram", + "english_stop" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "cjk_custom_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /cjk-index/_analyze +{ + "field": "content", + "text": "学生们在中国、日本和韩国的大学学习。123456" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "学生","start_offset": 0,"end_offset": 2,"type": "","position": 0}, + {"token": "生们","start_offset": 1,"end_offset": 3,"type": "","position": 1}, + {"token": "们在","start_offset": 2,"end_offset": 4,"type": "","position": 2}, + {"token": "在中","start_offset": 3,"end_offset": 5,"type": "","position": 3}, + {"token": "中国","start_offset": 4,"end_offset": 6,"type": "","position": 4}, + {"token": "日本","start_offset": 7,"end_offset": 9,"type": "","position": 5}, + {"token": "本和","start_offset": 8,"end_offset": 10,"type": "","position": 6}, + {"token": "和韩","start_offset": 9,"end_offset": 
11,"type": "","position": 7}, + {"token": "韩国","start_offset": 10,"end_offset": 12,"type": "","position": 8}, + {"token": "国的","start_offset": 11,"end_offset": 13,"type": "","position": 9}, + {"token": "的大","start_offset": 12,"end_offset": 14,"type": "","position": 10}, + {"token": "大学","start_offset": 13,"end_offset": 15,"type": "","position": 11}, + {"token": "学学","start_offset": 14,"end_offset": 16,"type": "","position": 12}, + {"token": "学习","start_offset": 15,"end_offset": 17,"type": "","position": 13}, + {"token": "123456","start_offset": 18,"end_offset": 24,"type": "","position": 14} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/czech.md b/_analyzers/language-analyzers/czech.md new file mode 100644 index 0000000000..c1778cd0f4 --- /dev/null +++ b/_analyzers/language-analyzers/czech.md @@ -0,0 +1,172 @@ +--- +layout: default +title: Czech +parent: Language analyzers +grand_parent: Analyzers +nav_order: 90 +--- + +# Czech analyzer + +The built-in `czech` analyzer can be applied to a text field using the following command: + +```json +PUT /czech-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "czech" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_czech_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_czech_analyzer": { + "type": "czech", + "stem_exclusion": ["autorita", "schválení"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Czech analyzer internals + +The `czech` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Czech) + - keyword + - stemmer (Czech) + +## Custom Czech analyzer + +You can create a custom Czech analyzer using the following command: + +```json +PUT /czech-index +{ + "settings": { + "analysis": { + "filter": { + "czech_stop": { + "type": "stop", + "stopwords": "_czech_" + }, + "czech_stemmer": { + "type": "stemmer", + "language": "czech" + }, + "czech_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "czech_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "czech_stop", + "czech_keywords", + "czech_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "czech_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /czech-index/_analyze +{ + "field": "content", + "text": "Studenti studují na českých univerzitách. Jejich čísla jsou 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "student", + "start_offset": 0, + "end_offset": 8, + "type": "", + "position": 0 + }, + { + "token": "studuj", + "start_offset": 9, + "end_offset": 16, + "type": "", + "position": 1 + }, + { + "token": "česk", + "start_offset": 20, + "end_offset": 27, + "type": "", + "position": 3 + }, + { + "token": "univerzit", + "start_offset": 28, + "end_offset": 40, + "type": "", + "position": 4 + }, + { + "token": "čísl", + "start_offset": 49, + "end_offset": 54, + "type": "", + "position": 6 + }, + { + "token": "123456", + "start_offset": 60, + "end_offset": 66, + "type": "", + "position": 8 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/danish.md b/_analyzers/language-analyzers/danish.md new file mode 100644 index 0000000000..b5ee1b0e97 --- /dev/null +++ b/_analyzers/language-analyzers/danish.md @@ -0,0 +1,172 @@ +--- +layout: default +title: Danish +parent: Language analyzers +grand_parent: Analyzers +nav_order: 100 +--- + +# Danish analyzer + +The built-in `danish` analyzer can be applied to a text field using the following command: + +```json +PUT /danish-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "danish" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_danish_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_danish_analyzer": { + "type": "danish", + "stem_exclusion": ["autoritet", "godkendelse"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Danish analyzer internals + +The `danish` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Danish) + - keyword + - stemmer (Danish) + +## Custom Danish analyzer + +You can create a custom Danish analyzer using the following command: + +```json +PUT /danish-index +{ + "settings": { + "analysis": { + "filter": { + "danish_stop": { + "type": "stop", + "stopwords": "_danish_" + }, + "danish_stemmer": { + "type": "stemmer", + "language": "danish" + }, + "danish_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "danish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "danish_stop", + "danish_keywords", + "danish_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "danish_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /danish-index/_analyze +{ + "field": "content", + "text": "Studerende studerer på de danske universiteter. Deres numre er 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "stud", + "start_offset": 0, + "end_offset": 10, + "type": "", + "position": 0 + }, + { + "token": "stud", + "start_offset": 11, + "end_offset": 19, + "type": "", + "position": 1 + }, + { + "token": "dansk", + "start_offset": 26, + "end_offset": 32, + "type": "", + "position": 4 + }, + { + "token": "universitet", + "start_offset": 33, + "end_offset": 46, + "type": "", + "position": 5 + }, + { + "token": "numr", + "start_offset": 54, + "end_offset": 59, + "type": "", + "position": 7 + }, + { + "token": "123456", + "start_offset": 63, + "end_offset": 69, + "type": "", + "position": 9 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/dutch.md b/_analyzers/language-analyzers/dutch.md new file mode 100644 index 0000000000..0259707d78 --- /dev/null +++ b/_analyzers/language-analyzers/dutch.md @@ -0,0 +1,148 @@ +--- +layout: default +title: Dutch +parent: Language analyzers +grand_parent: Analyzers +nav_order: 110 +--- + +# Dutch analyzer + +The built-in `dutch` analyzer can be applied to a text field using the following command: + +```json +PUT /dutch-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "dutch" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_dutch_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_dutch_analyzer": { + "type": "dutch", + "stem_exclusion": ["autoriteit", "goedkeuring"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Dutch analyzer internals + +The `dutch` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Dutch) + - keyword + - stemmer_override + - stemmer (Dutch) + +## Custom Dutch analyzer + +You can create a custom Dutch analyzer using the following command: + +```json +PUT /dutch-index +{ + "settings": { + "analysis": { + "filter": { + "dutch_stop": { + "type": "stop", + "stopwords": "_dutch_" + }, + "dutch_stemmer": { + "type": "stemmer", + "language": "dutch" + }, + "dutch_keywords": { + "type": "keyword_marker", + "keywords": [] + }, + "dutch_override": { + "type": "stemmer_override", + "rules": [ + "fiets=>fiets", + "bromfiets=>bromfiets", + "ei=>eier", + "kind=>kinder" + ] + } + }, + "analyzer": { + "dutch_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "dutch_stop", + "dutch_keywords", + "dutch_override", + "dutch_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "dutch_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /dutch-index/_analyze +{ + "field": "content", + "text": "De studenten studeren in Nederland en bezoeken Amsterdam. Hun nummers zijn 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "student","start_offset": 3,"end_offset": 12,"type": "","position": 1}, + {"token": "studer","start_offset": 13,"end_offset": 21,"type": "","position": 2}, + {"token": "nederland","start_offset": 25,"end_offset": 34,"type": "","position": 4}, + {"token": "bezoek","start_offset": 38,"end_offset": 46,"type": "","position": 6}, + {"token": "amsterdam","start_offset": 47,"end_offset": 56,"type": "","position": 7}, + {"token": "nummer","start_offset": 62,"end_offset": 69,"type": "","position": 9}, + {"token": "123456","start_offset": 75,"end_offset": 81,"type": "","position": 11} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/english.md b/_analyzers/language-analyzers/english.md new file mode 100644 index 0000000000..2d0b600312 --- /dev/null +++ b/_analyzers/language-analyzers/english.md @@ -0,0 +1,143 @@ +--- +layout: default +title: English +parent: Language analyzers +grand_parent: Analyzers +nav_order: 120 +--- + +# English analyzer + +The built-in `english` analyzer can be applied to a text field using the following command: + +```json +PUT /english-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "english" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_english_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_english_analyzer": { + "type": "english", + "stem_exclusion": ["authority", "authorization"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## English analyzer internals + +The `english` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - stemmer (possessive_english) + - lowercase + - stop (English) + - keyword + - stemmer (English) + +## Custom English analyzer + +You can create a custom English analyzer using the following command: + +```json +PUT /english-index +{ + "settings": { + "analysis": { + "filter": { + "english_stop": { + "type": "stop", + "stopwords": "_english_" + }, + "english_stemmer": { + "type": "stemmer", + "language": "english" + }, + "english_keywords": { + "type": "keyword_marker", + "keywords": [] + }, + "english_possessive_stemmer": { + "type": "stemmer", + "language": "possessive_english" + } + }, + "analyzer": { + "english_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "english_possessive_stemmer", + "lowercase", + "english_stop", + "english_keywords", + "english_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "english_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /english-index/_analyze +{ + "field": "content", + "text": "The students study in the USA and work at NASA. Their numbers are 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "student","start_offset": 4,"end_offset": 12,"type": "","position": 1}, + {"token": "studi","start_offset": 13,"end_offset": 18,"type": "","position": 2}, + {"token": "usa","start_offset": 26,"end_offset": 29,"type": "","position": 5}, + {"token": "work","start_offset": 34,"end_offset": 38,"type": "","position": 7}, + {"token": "nasa","start_offset": 42,"end_offset": 46,"type": "","position": 9}, + {"token": "number","start_offset": 54,"end_offset": 61,"type": "","position": 11}, + {"token": "123456","start_offset": 66,"end_offset": 72,"type": "","position": 13} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/estonian.md b/_analyzers/language-analyzers/estonian.md new file mode 100644 index 0000000000..a4cb664f18 --- /dev/null +++ b/_analyzers/language-analyzers/estonian.md @@ -0,0 +1,139 @@ +--- +layout: default +title: Estonian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 130 +--- + +# Estonian analyzer + +The built-in `estonian` analyzer can be applied to a text field using the following command: + +```json +PUT /estonian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "estonian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_estonian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_estonian_analyzer": { + "type": "estonian", + "stem_exclusion": ["autoriteet", "kinnitus"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Estonian analyzer internals + +The `estonian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Estonian) + - keyword + - stemmer (Estonian) + +## Custom Estonian analyzer + +You can create a custom Estonian analyzer using the following command: + +```json +PUT /estonian-index +{ + "settings": { + "analysis": { + "filter": { + "estonian_stop": { + "type": "stop", + "stopwords": "_estonian_" + }, + "estonian_stemmer": { + "type": "stemmer", + "language": "estonian" + }, + "estonian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "estonian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "estonian_stop", + "estonian_keywords", + "estonian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "estonian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /estonian-index/_analyze +{ + "field": "content", + "text": "Õpilased õpivad Tallinnas ja Eesti ülikoolides. Nende numbrid on 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "õpilase","start_offset": 0,"end_offset": 8,"type": "","position": 0}, + {"token": "õpi","start_offset": 9,"end_offset": 15,"type": "","position": 1}, + {"token": "tallinna","start_offset": 16,"end_offset": 25,"type": "","position": 2}, + {"token": "eesti","start_offset": 29,"end_offset": 34,"type": "","position": 4}, + {"token": "ülikooli","start_offset": 35,"end_offset": 46,"type": "","position": 5}, + {"token": "nende","start_offset": 48,"end_offset": 53,"type": "","position": 6}, + {"token": "numbri","start_offset": 54,"end_offset": 61,"type": "","position": 7}, + {"token": "on","start_offset": 62,"end_offset": 64,"type": "","position": 8}, + {"token": "123456","start_offset": 65,"end_offset": 71,"type": "","position": 9} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/finnish.md b/_analyzers/language-analyzers/finnish.md new file mode 100644 index 0000000000..6f559650d2 --- /dev/null +++ b/_analyzers/language-analyzers/finnish.md @@ -0,0 +1,137 @@ +--- +layout: default +title: Finnish +parent: Language analyzers +grand_parent: Analyzers +nav_order: 140 +--- + +# Finnish analyzer + +The built-in `finnish` analyzer can be applied to a text field using the following command: + +```json +PUT /finnish-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "finnish" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_finnish_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_finnish_analyzer": { + "type": "finnish", + "stem_exclusion": ["valta", "hyväksyntä"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Finnish analyzer internals + +The `finnish` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Finnish) + - keyword + - stemmer (Finnish) + +## Custom Finnish analyzer + +You can create a custom Finnish analyzer using the following command: + +```json +PUT /finnish-index +{ + "settings": { + "analysis": { + "filter": { + "finnish_stop": { + "type": "stop", + "stopwords": "_finnish_" + }, + "finnish_stemmer": { + "type": "stemmer", + "language": "finnish" + }, + "finnish_keywords": { + "type": "keyword_marker", + "keywords": ["Helsinki", "Suomi"] + } + }, + "analyzer": { + "finnish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "finnish_stop", + "finnish_keywords", + "finnish_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "finnish_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /finnish-index/_analyze +{ + "field": "content", + "text": "Opiskelijat opiskelevat Helsingissä ja Suomen yliopistoissa. Heidän numeronsa ovat 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "opiskelij","start_offset": 0,"end_offset": 11,"type": "","position": 0}, + {"token": "opiskelev","start_offset": 12,"end_offset": 23,"type": "","position": 1}, + {"token": "helsing","start_offset": 24,"end_offset": 35,"type": "","position": 2}, + {"token": "suome","start_offset": 39,"end_offset": 45,"type": "","position": 4}, + {"token": "yliopisto","start_offset": 46,"end_offset": 59,"type": "","position": 5}, + {"token": "numero","start_offset": 68,"end_offset": 77,"type": "","position": 7}, + {"token": "123456","start_offset": 83,"end_offset": 89,"type": "","position": 9} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/french.md b/_analyzers/language-analyzers/french.md new file mode 100644 index 0000000000..64e7ab5415 --- /dev/null +++ b/_analyzers/language-analyzers/french.md @@ -0,0 +1,148 @@ +--- +layout: default +title: French +parent: Language analyzers +grand_parent: Analyzers +nav_order: 150 +--- + +# French analyzer + +The built-in `french` analyzer can be applied to a text field using the following command: + +```json +PUT /french-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "french" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_french_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_french_analyzer": { + "type": "french", + "stem_exclusion": ["autorité", "acceptation"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## French analyzer internals + +The `french` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - elision (French) + - lowercase + - stop (French) + - keyword + - stemmer (French) + +## Custom French analyzer + +You can create a custom French analyzer using the following command: + +```json +PUT /french-index +{ + "settings": { + "analysis": { + "filter": { + "french_stop": { + "type": "stop", + "stopwords": "_french_" + }, + "french_elision": { + "type": "elision", + "articles_case": true, + "articles": [ + "l", "m", "t", "qu", "n", "s", + "j", "d", "c", "jusqu", "quoiqu", + "lorsqu", "puisqu" + ] + }, + "french_stemmer": { + "type": "stemmer", + "language": "light_french" + }, + "french_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "french_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "french_elision", + "lowercase", + "french_stop", + "french_keywords", + "french_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "french_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /french-index/_analyze +{ + "field": "content", + "text": "Les étudiants étudient à Paris et dans les universités françaises. Leurs numéros sont 123456." 
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {"token": "etudiant","start_offset": 4,"end_offset": 13,"type": "<ALPHANUM>","position": 1},
+    {"token": "etudient","start_offset": 14,"end_offset": 22,"type": "<ALPHANUM>","position": 2},
+    {"token": "pari","start_offset": 25,"end_offset": 30,"type": "<ALPHANUM>","position": 4},
+    {"token": "universit","start_offset": 43,"end_offset": 54,"type": "<ALPHANUM>","position": 8},
+    {"token": "francais","start_offset": 55,"end_offset": 65,"type": "<ALPHANUM>","position": 9},
+    {"token": "numero","start_offset": 73,"end_offset": 80,"type": "<ALPHANUM>","position": 11},
+    {"token": "123456","start_offset": 86,"end_offset": 92,"type": "<NUM>","position": 13}
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/language-analyzers/galician.md b/_analyzers/language-analyzers/galician.md
new file mode 100644
index 0000000000..00338b23a7
--- /dev/null
+++ b/_analyzers/language-analyzers/galician.md
@@ -0,0 +1,138 @@
+---
+layout: default
+title: Galician
+parent: Language analyzers
+grand_parent: Analyzers
+nav_order: 160
+---
+
+# Galician analyzer
+
+The built-in `galician` analyzer can be applied to a text field using the following command:
+
+```json
+PUT /galician-index
+{
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "galician"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Stem exclusion
+
+You can use `stem_exclusion` with this language analyzer using the following command:
+
+```json
+PUT index_with_stem_exclusion_galician_analyzer
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "stem_exclusion_galician_analyzer": {
+          "type": "galician",
+          "stem_exclusion": ["autoridade", "aceptación"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Galician analyzer internals
+
+The `galician` analyzer is built using the following components:
+
+- Tokenizer: `standard`
+
+- Token filters:
+  - lowercase
+  - stop (Galician)
+  - keyword
+  - stemmer (Galician)
+
+## Custom Galician analyzer
+
+You can create a custom Galician analyzer using the following command:
+
+```json
+PUT /galician-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "galician_stop": {
+          "type": "stop",
+          "stopwords": "_galician_"
+        },
+        "galician_stemmer": {
+          "type": "stemmer",
+          "language": "galician"
+        },
+        "galician_keywords": {
+          "type": "keyword_marker",
+          "keywords": []
+        }
+      },
+      "analyzer": {
+        "galician_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "galician_stop",
+            "galician_keywords",
+            "galician_stemmer"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "galician_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /galician-index/_analyze
+{
+  "field": "content",
+  "text": "Os estudantes estudan en Santiago e nas universidades galegas. Os seus números son 123456."
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "estud","start_offset": 3,"end_offset": 13,"type": "","position": 1}, + {"token": "estud","start_offset": 14,"end_offset": 21,"type": "","position": 2}, + {"token": "santiag","start_offset": 25,"end_offset": 33,"type": "","position": 4}, + {"token": "univers","start_offset": 40,"end_offset": 53,"type": "","position": 7}, + {"token": "galeg","start_offset": 54,"end_offset": 61,"type": "","position": 8}, + {"token": "numer","start_offset": 71,"end_offset": 78,"type": "","position": 11}, + {"token": "son","start_offset": 79,"end_offset": 82,"type": "","position": 12}, + {"token": "123456","start_offset": 83,"end_offset": 89,"type": "","position": 13} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/german.md b/_analyzers/language-analyzers/german.md new file mode 100644 index 0000000000..4071ef5378 --- /dev/null +++ b/_analyzers/language-analyzers/german.md @@ -0,0 +1,174 @@ +--- +layout: default +title: German +parent: Language analyzers +grand_parent: Analyzers +nav_order: 170 +--- + +# German analyzer + +The built-in `german` analyzer can be applied to a text field using the following command: + +```json +PUT /german-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "german" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_german_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_german_analyzer": { + "type": "german", + "stem_exclusion": ["Autorität", "Genehmigung"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## German analyzer internals + +The `german` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (German) + - keyword + - normalization (German) + - stemmer (German) + +## Custom German analyzer + +You can create a custom German analyzer using the following command: + +```json +PUT /german-index +{ + "settings": { + "analysis": { + "filter": { + "german_stop": { + "type": "stop", + "stopwords": "_german_" + }, + "german_stemmer": { + "type": "stemmer", + "language": "light_german" + }, + "german_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "german_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "german_stop", + "german_keywords", + "german_normalization", + "german_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "german_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /german-index/_analyze +{ + "field": "content", + "text": "Die Studenten studieren an den deutschen Universitäten. Ihre Nummern sind 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "student", + "start_offset": 4, + "end_offset": 13, + "type": "", + "position": 1 + }, + { + "token": "studi", + "start_offset": 14, + "end_offset": 23, + "type": "", + "position": 2 + }, + { + "token": "deutsch", + "start_offset": 31, + "end_offset": 40, + "type": "", + "position": 5 + }, + { + "token": "universitat", + "start_offset": 41, + "end_offset": 54, + "type": "", + "position": 6 + }, + { + "token": "numm", + "start_offset": 61, + "end_offset": 68, + "type": "", + "position": 8 + }, + { + "token": "123456", + "start_offset": 74, + "end_offset": 80, + "type": "", + "position": 10 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/greek.md b/_analyzers/language-analyzers/greek.md new file mode 100644 index 0000000000..2446b1e2d6 --- /dev/null +++ b/_analyzers/language-analyzers/greek.md @@ -0,0 +1,139 @@ +--- +layout: default +title: Greek +parent: Language analyzers +grand_parent: Analyzers +nav_order: 180 +--- + +# Greek analyzer + +The built-in `greek` analyzer can be applied to a text field using the following command: + +```json +PUT /greek-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "greek" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_greek_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_greek_analyzer": { + "type": "greek", + "stem_exclusion": ["αρχή", "έγκριση"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Greek analyzer internals + +The `greek` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Greek) + - keyword + - stemmer (Greek) + +## Custom Greek analyzer + +You can create a custom Greek analyzer using the following command: + +```json +PUT /greek-index +{ + "settings": { + "analysis": { + "filter": { + "greek_stop": { + "type": "stop", + "stopwords": "_greek_" + }, + "greek_stemmer": { + "type": "stemmer", + "language": "greek" + }, + "greek_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "greek_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "greek_stop", + "greek_keywords", + "greek_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "greek_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /greek-index/_analyze +{ + "field": "content", + "text": "Οι φοιτητές σπουδάζουν στα ελληνικά πανεπιστήμια. Οι αριθμοί τους είναι 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "φοιτητές","start_offset": 3,"end_offset": 11,"type": "","position": 1}, + {"token": "σπουδάζ","start_offset": 12,"end_offset": 22,"type": "","position": 2}, + {"token": "στα","start_offset": 23,"end_offset": 26,"type": "","position": 3}, + {"token": "ελληνικά","start_offset": 27,"end_offset": 35,"type": "","position": 4}, + {"token": "πανεπιστήμ","start_offset": 36,"end_offset": 48,"type": "","position": 5}, + {"token": "αριθμοί","start_offset": 53,"end_offset": 60,"type": "","position": 7}, + {"token": "τους","start_offset": 61,"end_offset": 65,"type": "","position": 8}, + {"token": "είνα","start_offset": 66,"end_offset": 71,"type": "","position": 9}, + {"token": "123456","start_offset": 72,"end_offset": 78,"type": "","position": 10} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/hindi.md b/_analyzers/language-analyzers/hindi.md new file mode 100644 index 0000000000..93f2eea319 --- /dev/null +++ b/_analyzers/language-analyzers/hindi.md @@ -0,0 +1,178 @@ +--- +layout: default +title: Hindi +parent: Language analyzers +grand_parent: Analyzers +nav_order: 190 +--- + +# Hindi analyzer + +The built-in `hindi` analyzer can be applied to a text field using the following command: + +```json +PUT /hindi-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "hindi" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_hindi_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_hindi_analyzer": { + "type": "hindi", + "stem_exclusion": ["अधिकार", "अनुमोदन"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Hindi analyzer internals + +The `hindi` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - decimal_digit + - keyword + - normalization (indic) + - normalization (Hindi) + - stop (Hindi) + - stemmer (Hindi) + +## Custom Hindi analyzer + +You can create a custom Hindi analyzer using the following command: + +```json +PUT /hindi-index +{ + "settings": { + "analysis": { + "filter": { + "hindi_stop": { + "type": "stop", + "stopwords": "_hindi_" + }, + "hindi_stemmer": { + "type": "stemmer", + "language": "hindi" + }, + "hindi_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "hindi_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "decimal_digit", + "hindi_keywords", + "indic_normalization", + "hindi_normalization", + "hindi_stop", + "hindi_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "hindi_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /hindi-index/_analyze +{ + "field": "content", + "text": "छात्र भारतीय विश्वविद्यालयों में पढ़ते हैं। उनके नंबर १२३४५६ हैं।" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "छातर", + "start_offset": 0, + "end_offset": 5, + "type": "", + "position": 0 + }, + { + "token": "भारतिय", + "start_offset": 6, + "end_offset": 12, + "type": "", + "position": 1 + }, + { + "token": "विशवविदयालय", + 
"start_offset": 13, + "end_offset": 28, + "type": "", + "position": 2 + }, + { + "token": "पढ", + "start_offset": 33, + "end_offset": 38, + "type": "", + "position": 4 + }, + { + "token": "नंबर", + "start_offset": 49, + "end_offset": 53, + "type": "", + "position": 7 + }, + { + "token": "123456", + "start_offset": 54, + "end_offset": 60, + "type": "", + "position": 8 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/hungarian.md b/_analyzers/language-analyzers/hungarian.md new file mode 100644 index 0000000000..d115c5d29c --- /dev/null +++ b/_analyzers/language-analyzers/hungarian.md @@ -0,0 +1,172 @@ +--- +layout: default +title: Hungarian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 200 +--- + +# Hungarian analyzer + +The built-in `hungarian` analyzer can be applied to a text field using the following command: + +```json +PUT /hungarian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "hungarian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_hungarian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_hungarian_analyzer": { + "type": "hungarian", + "stem_exclusion": ["hatalom", "jóváhagyás"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Hungarian analyzer internals + +The `hungarian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Hungarian) + - keyword + - stemmer (Hungarian) + +## Custom Hungarian analyzer + +You can create a custom Hungarian analyzer using the following command: + +```json +PUT /hungarian-index +{ + "settings": { + "analysis": { + "filter": { + "hungarian_stop": { + "type": "stop", + "stopwords": "_hungarian_" + }, + "hungarian_stemmer": { + "type": "stemmer", + "language": "hungarian" + }, + "hungarian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "hungarian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "hungarian_stop", + "hungarian_keywords", + "hungarian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "hungarian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /hungarian-index/_analyze +{ + "field": "content", + "text": "A diákok a magyar egyetemeken tanulnak. A számaik 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "diák", + "start_offset": 2, + "end_offset": 8, + "type": "", + "position": 1 + }, + { + "token": "magyar", + "start_offset": 11, + "end_offset": 17, + "type": "", + "position": 3 + }, + { + "token": "egyetem", + "start_offset": 18, + "end_offset": 29, + "type": "", + "position": 4 + }, + { + "token": "tanul", + "start_offset": 30, + "end_offset": 38, + "type": "", + "position": 5 + }, + { + "token": "szám", + "start_offset": 42, + "end_offset": 49, + "type": "", + "position": 7 + }, + { + "token": "123456", + "start_offset": 50, + "end_offset": 56, + "type": "", + "position": 8 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/index.md b/_analyzers/language-analyzers/index.md new file mode 100644 index 0000000000..89a4a42254 --- /dev/null +++ b/_analyzers/language-analyzers/index.md @@ -0,0 +1,135 @@ +--- +layout: default +title: Language analyzers +nav_order: 100 +parent: Analyzers +has_children: true +has_toc: true +redirect_from: + - /query-dsl/analyzers/language-analyzers/ + - /analyzers/language-analyzers/ +--- + +# Language analyzers + +OpenSearch supports the following language analyzers: +`arabic`, `armenian`, `basque`, `bengali`, `brazilian`, `bulgarian`, `catalan`, `czech`, `danish`, `dutch`, `english`, `estonian`, `finnish`, `french`, `galician`, `german`, `greek`, `hindi`, `hungarian`, `indonesian`, `irish`, `italian`, `latvian`, `lithuanian`, `norwegian`, `persian`, `portuguese`, `romanian`, `russian`, `sorani`, `spanish`, `swedish`, `thai`, and `turkish`. + +To use an analyzer when you map an index, specify the value in your query. For example, to map your index with the French language analyzer, specify the `french` value in the analyzer field: + +```json + "analyzer": "french" +``` + +#### Example request + +The following query specifies an index `my-index` with the `content` field configured as multi-field, and a sub-field named `french` is configured with the `french` language analyzer: + +```json +PUT my-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "fields": { + "french": { + "type": "text", + "analyzer": "french" + } + } + } + } + } +} +``` +{% include copy-curl.html %} + +The default `french` analyzer can also be configured for the entire index using the following query: + +```json +PUT my-index +{ + "settings": { + "analysis": { + "analyzer": { + "default": { + "type": "french" + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text" + }, + "title": { + "type": "text" + }, + "description": { + "type": "text" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can apply stem exclusion to any language analyzer by providing a list of lowercase words that should be excluded from stemming. Internally, OpenSearch uses the `keyword_marker` token filter to mark these words as keywords, ensuring that they are not stemmed. + +## Stem exclusion example + +Use the following request to configure `stem_exclusion`: + +```json +PUT index_with_stem_exclusion_english_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_english_analyzer":{ + "type":"english", + "stem_exclusion": ["manager", "management"] + } + } + } + } +} +``` +{% include copy-curl.html %} + + +## Stem exclusion with custom analyzers + +All language analyzers consist of tokenizers and token filters specific to a particular language. 
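+
+For example, you can inspect each stage of a language analyzer by setting the `explain` parameter in an `_analyze` request. The following request is an illustrative sketch that uses the built-in `english` analyzer with sample text:
+
+```json
+GET /_analyze
+{
+  "analyzer": "english",
+  "text": "The managers are managing",
+  "explain": true
+}
+```
+{% include copy-curl.html %}
+
+The response contains a `detail` object listing the tokens emitted by the tokenizer and by each token filter in turn.
+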
+If you want to implement a custom version of the language analyzer with stem exclusion, you need to configure the `keyword_marker` token filter and list the words excluded from stemming in the `keywords` parameter. The stemmer referenced by the analyzer must also be defined, as shown in the following example:
+
+```json
+PUT index_with_keyword_marker_analyzer
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "protected_keywords_filter": {
+          "type": "keyword_marker",
+          "keywords": ["Apple", "OpenSearch"]
+        },
+        "english_stemmer": {
+          "type": "stemmer",
+          "language": "english"
+        }
+      },
+      "analyzer": {
+        "custom_english_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "protected_keywords_filter",
+            "english_stemmer"
+          ]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
diff --git a/_analyzers/language-analyzers/indonesian.md b/_analyzers/language-analyzers/indonesian.md
new file mode 100644
index 0000000000..5c3d430b3a
--- /dev/null
+++ b/_analyzers/language-analyzers/indonesian.md
@@ -0,0 +1,172 @@
+---
+layout: default
+title: Indonesian
+parent: Language analyzers
+grand_parent: Analyzers
+nav_order: 210
+---
+
+# Indonesian analyzer
+
+The built-in `indonesian` analyzer can be applied to a text field using the following command:
+
+```json
+PUT /indonesian-index
+{
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "indonesian"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Stem exclusion
+
+You can use `stem_exclusion` with this language analyzer using the following command:
+
+```json
+PUT index_with_stem_exclusion_indonesian_analyzer
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "stem_exclusion_indonesian_analyzer": {
+          "type": "indonesian",
+          "stem_exclusion": ["otoritas", "persetujuan"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Indonesian analyzer internals
+
+The `indonesian` analyzer is built using the following components:
+
+- Tokenizer: `standard`
+
+- Token filters:
+  - lowercase
+  - stop (Indonesian)
+  - keyword
+  - stemmer (Indonesian)
+
+## Custom Indonesian analyzer
+
+You can create a custom Indonesian analyzer using the following command:
+
+```json
+PUT /indonesian-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "indonesian_stop": {
+          "type": "stop",
+          "stopwords": "_indonesian_"
+        },
+        "indonesian_stemmer": {
+          "type": "stemmer",
+          "language": "indonesian"
+        },
+        "indonesian_keywords": {
+          "type": "keyword_marker",
+          "keywords": []
+        }
+      },
+      "analyzer": {
+        "indonesian_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "indonesian_stop",
+            "indonesian_keywords",
+            "indonesian_stemmer"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "indonesian_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /indonesian-index/_analyze
+{
+  "field": "content",
+  "text": "Mahasiswa belajar di universitas Indonesia. Nomor mereka adalah 123456."
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "mahasiswa", + "start_offset": 0, + "end_offset": 9, + "type": "", + "position": 0 + }, + { + "token": "ajar", + "start_offset": 10, + "end_offset": 17, + "type": "", + "position": 1 + }, + { + "token": "universitas", + "start_offset": 21, + "end_offset": 32, + "type": "", + "position": 3 + }, + { + "token": "indonesia", + "start_offset": 33, + "end_offset": 42, + "type": "", + "position": 4 + }, + { + "token": "nomor", + "start_offset": 44, + "end_offset": 49, + "type": "", + "position": 5 + }, + { + "token": "123456", + "start_offset": 64, + "end_offset": 70, + "type": "", + "position": 8 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/irish.md b/_analyzers/language-analyzers/irish.md new file mode 100644 index 0000000000..3e1535d134 --- /dev/null +++ b/_analyzers/language-analyzers/irish.md @@ -0,0 +1,157 @@ +--- +layout: default +title: Irish +parent: Language analyzers +grand_parent: Analyzers +nav_order: 210 +--- + +# Irish analyzer + +The built-in `irish` analyzer can be applied to a text field using the following command: + +```json +PUT /irish-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "irish" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_irish_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_irish_analyzer": { + "type": "irish", + "stem_exclusion": ["údarás", "faomhadh"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Irish analyzer internals + +The `irish` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - hyphenation (Irish) + - elision (Irish) + - lowercase (Irish) + - stop (Irish) + - keyword + - stemmer (Irish) + +## Custom Irish analyzer + +You can create a custom Irish analyzer using the following command: + +```json +PUT /irish-index +{ + "settings": { + "analysis": { + "filter": { + "irish_stop": { + "type": "stop", + "stopwords": "_irish_" + }, + "irish_elision": { + "type": "elision", + "articles": [ "d", "m", "b" ], + "articles_case": true + }, + "irish_hyphenation": { + "type": "stop", + "stopwords": [ "h", "n", "t" ], + "ignore_case": true + }, + "irish_lowercase": { + "type": "lowercase", + "language": "irish" + }, + "irish_stemmer": { + "type": "stemmer", + "language": "irish" + }, + "irish_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "irish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "irish_hyphenation", + "irish_elision", + "irish_lowercase", + "irish_stop", + "irish_keywords", + "irish_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "irish_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /irish-index/_analyze +{ + "field": "content", + "text": "Tá mic léinn ag staidéar in ollscoileanna na hÉireann. Is iad a gcuid uimhreacha ná 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "tá","start_offset": 0,"end_offset": 2,"type": "","position": 0}, + {"token": "mic","start_offset": 3,"end_offset": 6,"type": "","position": 1}, + {"token": "léinn","start_offset": 7,"end_offset": 12,"type": "","position": 2}, + {"token": "staidéar","start_offset": 16,"end_offset": 24,"type": "","position": 4}, + {"token": "ollscoileanna","start_offset": 28,"end_offset": 41,"type": "","position": 6}, + {"token": "héireann","start_offset": 45,"end_offset": 53,"type": "","position": 8}, + {"token": "cuid","start_offset": 64,"end_offset": 69,"type": "","position": 12}, + {"token": "uimhreacha","start_offset": 70,"end_offset": 80,"type": "","position": 13}, + {"token": "123456","start_offset": 84,"end_offset": 90,"type": "","position": 15} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/italian.md b/_analyzers/language-analyzers/italian.md new file mode 100644 index 0000000000..190056d63c --- /dev/null +++ b/_analyzers/language-analyzers/italian.md @@ -0,0 +1,148 @@ +--- +layout: default +title: Italian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 220 +--- + +# Italian analyzer + +The built-in `italian` analyzer can be applied to a text field using the following command: + +```json +PUT /italian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "italian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_italian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_italian_analyzer": { + "type": "italian", + "stem_exclusion": ["autorità", "approvazione"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Italian analyzer internals + +The `italian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - elision (Italian) + - lowercase + - stop (Italian) + - keyword + - stemmer (Italian) + +## Custom Italian analyzer + +You can create a custom Italian analyzer using the following command: + +```json +PUT /italian-index +{ + "settings": { + "analysis": { + "filter": { + "italian_stop": { + "type": "stop", + "stopwords": "_italian_" + }, + "italian_elision": { + "type": "elision", + "articles": [ + "c", "l", "all", "dall", "dell", + "nell", "sull", "coll", "pell", + "gl", "agl", "dagl", "degl", "negl", + "sugl", "un", "m", "t", "s", "v", "d" + ], + "articles_case": true + }, + "italian_stemmer": { + "type": "stemmer", + "language": "light_italian" + }, + "italian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "italian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "italian_elision", + "lowercase", + "italian_stop", + "italian_keywords", + "italian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "italian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /italian-index/_analyze +{ + "field": "content", + "text": "Gli studenti studiano nelle università italiane. I loro numeri sono 123456." 
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {"token": "student","start_offset": 4,"end_offset": 12,"type": "<ALPHANUM>","position": 1},
+    {"token": "studian","start_offset": 13,"end_offset": 21,"type": "<ALPHANUM>","position": 2},
+    {"token": "universit","start_offset": 28,"end_offset": 38,"type": "<ALPHANUM>","position": 4},
+    {"token": "italian","start_offset": 39,"end_offset": 47,"type": "<ALPHANUM>","position": 5},
+    {"token": "numer","start_offset": 56,"end_offset": 62,"type": "<ALPHANUM>","position": 8},
+    {"token": "123456","start_offset": 68,"end_offset": 74,"type": "<NUM>","position": 10}
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/language-analyzers/latvian.md b/_analyzers/language-analyzers/latvian.md
new file mode 100644
index 0000000000..2301759763
--- /dev/null
+++ b/_analyzers/language-analyzers/latvian.md
@@ -0,0 +1,148 @@
+---
+layout: default
+title: Latvian
+parent: Language analyzers
+grand_parent: Analyzers
+nav_order: 230
+---
+
+# Latvian analyzer
+
+The built-in `latvian` analyzer can be applied to a text field using the following command:
+
+```json
+PUT /latvian-index
+{
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "latvian"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Stem exclusion
+
+You can use `stem_exclusion` with this language analyzer using the following command:
+
+```json
+PUT index_with_stem_exclusion_latvian_analyzer
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "stem_exclusion_latvian_analyzer": {
+          "type": "latvian",
+          "stem_exclusion": ["autoritāte", "apstiprinājums"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Latvian analyzer internals
+
+The `latvian` analyzer is built using the following components:
+
+- Tokenizer: `standard`
+
+- Token filters:
+  - lowercase
+  - stop (Latvian)
+  - keyword
+  - stemmer (Latvian)
+
+## Custom Latvian analyzer
+
+You can create a custom Latvian analyzer using the following command:
+
+```json
+PUT /latvian-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "latvian_stop": {
+          "type": "stop",
+          "stopwords": "_latvian_"
+        },
+        "latvian_stemmer": {
+          "type": "stemmer",
+          "language": "latvian"
+        },
+        "latvian_keywords": {
+          "type": "keyword_marker",
+          "keywords": []
+        }
+      },
+      "analyzer": {
+        "latvian_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "latvian_stop",
+            "latvian_keywords",
+            "latvian_stemmer"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "latvian_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /latvian-index/_analyze
+{
+  "field": "content",
+  "text": "Studenti mācās Latvijas universitātēs. Viņu numuri ir 123456."
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "student","start_offset": 0,"end_offset": 8,"type": "","position": 0}, + {"token": "māc","start_offset": 9,"end_offset": 14,"type": "","position": 1}, + {"token": "latvij","start_offset": 15,"end_offset": 23,"type": "","position": 2}, + {"token": "universitāt","start_offset": 24,"end_offset": 37,"type": "","position": 3}, + {"token": "vin","start_offset": 39,"end_offset": 43,"type": "","position": 4}, + {"token": "numur","start_offset": 44,"end_offset": 50,"type": "","position": 5}, + {"token": "123456","start_offset": 54,"end_offset": 60,"type": "","position": 7} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/lithuanian.md b/_analyzers/language-analyzers/lithuanian.md new file mode 100644 index 0000000000..ca5966c54e --- /dev/null +++ b/_analyzers/language-analyzers/lithuanian.md @@ -0,0 +1,136 @@ +--- +layout: default +title: Lithuanian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 230 +--- + +# Lithuanian analyzer + +The built-in `lithuanian` analyzer can be applied to a text field using the following command: + +```json +PUT /lithuanian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "lithuanian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_lithuanian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_lithuanian_analyzer": { + "type": "lithuanian", + "stem_exclusion": ["autoritetas", "patvirtinimas"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Lithuanian analyzer internals + +The `lithuanian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Lithuanian) + - keyword + - stemmer (Lithuanian) + +## Custom Lithuanian analyzer + +You can create a custom Lithuanian analyzer using the following command: + +```json +PUT /lithuanian-index +{ + "settings": { + "analysis": { + "filter": { + "lithuanian_stop": { + "type": "stop", + "stopwords": "_lithuanian_" + }, + "lithuanian_stemmer": { + "type": "stemmer", + "language": "lithuanian" + }, + "lithuanian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "lithuanian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "lithuanian_stop", + "lithuanian_keywords", + "lithuanian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "lithuanian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /lithuanian-index/_analyze +{ + "field": "content", + "text": "Studentai mokosi Lietuvos universitetuose. Jų numeriai yra 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "student","start_offset": 0,"end_offset": 9,"type": "","position": 0}, + {"token": "mok","start_offset": 10,"end_offset": 16,"type": "","position": 1}, + {"token": "lietuv","start_offset": 17,"end_offset": 25,"type": "","position": 2}, + {"token": "universitet","start_offset": 26,"end_offset": 41,"type": "","position": 3}, + {"token": "num","start_offset": 46,"end_offset": 54,"type": "","position": 5}, + {"token": "123456","start_offset": 59,"end_offset": 65,"type": "","position": 7} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/norwegian.md b/_analyzers/language-analyzers/norwegian.md new file mode 100644 index 0000000000..cfb04eebf3 --- /dev/null +++ b/_analyzers/language-analyzers/norwegian.md @@ -0,0 +1,137 @@ +--- +layout: default +title: Norwegian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 240 +--- + +# Norwegian analyzer + +The built-in `norwegian` analyzer can be applied to a text field using the following command: + +```json +PUT /norwegian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "norwegian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_norwegian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_norwegian_analyzer": { + "type": "norwegian", + "stem_exclusion": ["autoritet", "godkjenning"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Norwegian analyzer internals + +The `norwegian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Norwegian) + - keyword + - stemmer (Norwegian) + +## Custom Norwegian analyzer + +You can create a custom Norwegian analyzer using the following command: + +```json +PUT /norwegian-index +{ + "settings": { + "analysis": { + "filter": { + "norwegian_stop": { + "type": "stop", + "stopwords": "_norwegian_" + }, + "norwegian_stemmer": { + "type": "stemmer", + "language": "norwegian" + }, + "norwegian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "norwegian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "norwegian_stop", + "norwegian_keywords", + "norwegian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "norwegian_analyzer" + } + } + } +} + +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /norwegian-index/_analyze +{ + "field": "content", + "text": "Studentene studerer ved norske universiteter. Deres nummer er 123456." 
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {"token": "student","start_offset": 0,"end_offset": 10,"type": "<ALPHANUM>","position": 0},
+    {"token": "studer","start_offset": 11,"end_offset": 19,"type": "<ALPHANUM>","position": 1},
+    {"token": "norsk","start_offset": 24,"end_offset": 30,"type": "<ALPHANUM>","position": 3},
+    {"token": "universitet","start_offset": 31,"end_offset": 44,"type": "<ALPHANUM>","position": 4},
+    {"token": "numm","start_offset": 52,"end_offset": 58,"type": "<ALPHANUM>","position": 6},
+    {"token": "123456","start_offset": 62,"end_offset": 68,"type": "<NUM>","position": 8}
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/language-analyzers/persian.md b/_analyzers/language-analyzers/persian.md
new file mode 100644
index 0000000000..40b38656fd
--- /dev/null
+++ b/_analyzers/language-analyzers/persian.md
@@ -0,0 +1,144 @@
+---
+layout: default
+title: Persian
+parent: Language analyzers
+grand_parent: Analyzers
+nav_order: 250
+---
+
+# Persian analyzer
+
+The built-in `persian` analyzer can be applied to a text field using the following command:
+
+```json
+PUT /persian-index
+{
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "persian"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Stem exclusion
+
+You can use `stem_exclusion` with this language analyzer using the following command:
+
+```json
+PUT index_with_stem_exclusion_persian_analyzer
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "stem_exclusion_persian_analyzer": {
+          "type": "persian",
+          "stem_exclusion": ["حکومت", "تأیید"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Persian analyzer internals
+
+The `persian` analyzer is built using the following components:
+
+- Tokenizer: `standard`
+
+- Char filter: `mapping`
+
+- Token filters:
+  - lowercase
+  - decimal_digit
+  - normalization (Arabic)
+  - normalization (Persian)
+  - keyword
+  - stop (Persian)
+
+## Custom Persian analyzer
+
+You can create a custom Persian analyzer using the following command:
+
+```json
+PUT /persian-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "persian_stop": {
+          "type": "stop",
+          "stopwords": "_persian_"
+        },
+        "persian_keywords": {
+          "type": "keyword_marker",
+          "keywords": []
+        }
+      },
+      "char_filter": {
+        "null_width_replace_with_space": {
+          "type": "mapping",
+          "mappings": [ "\\u200C=>\\u0020"]
+        }
+      },
+      "analyzer": {
+        "persian_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "char_filter": [ "null_width_replace_with_space" ],
+          "filter": [
+            "lowercase",
+            "decimal_digit",
+            "arabic_normalization",
+            "persian_normalization",
+            "persian_stop"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "persian_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:

+```json
+POST /persian-index/_analyze
+{
+  "field": "content",
+  "text": "دانشجویان در دانشگاه‌های ایرانی تحصیل می‌کنند. شماره‌های آن‌ها ۱۲۳۴۵۶ است."
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "دانشجويان","start_offset": 0,"end_offset": 9,"type": "","position": 0}, + {"token": "دانشگاه","start_offset": 13,"end_offset": 20,"type": "","position": 2}, + {"token": "ايراني","start_offset": 25,"end_offset": 31,"type": "","position": 4}, + {"token": "تحصيل","start_offset": 32,"end_offset": 37,"type": "","position": 5}, + {"token": "شماره","start_offset": 47,"end_offset": 52,"type": "","position": 8}, + {"token": "123456","start_offset": 63,"end_offset": 69,"type": "","position": 12} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/portuguese.md b/_analyzers/language-analyzers/portuguese.md new file mode 100644 index 0000000000..166ffa0010 --- /dev/null +++ b/_analyzers/language-analyzers/portuguese.md @@ -0,0 +1,172 @@ +--- +layout: default +title: Portuguese +parent: Language analyzers +grand_parent: Analyzers +nav_order: 260 +--- + +# Portuguese analyzer + +The built-in `portuguese` analyzer can be applied to a text field using the following command: + +```json +PUT /portuguese-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "portuguese" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_portuguese_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_portuguese_analyzer": { + "type": "portuguese", + "stem_exclusion": ["autoridade", "aprovação"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Portuguese analyzer internals + +The `portuguese` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Portuguese) + - keyword + - stemmer (Portuguese) + +## Custom Portuguese analyzer + +You can create a custom Portuguese analyzer using the following command: + +```json +PUT /portuguese-index +{ + "settings": { + "analysis": { + "filter": { + "portuguese_stop": { + "type": "stop", + "stopwords": "_portuguese_" + }, + "portuguese_stemmer": { + "type": "stemmer", + "language": "light_portuguese" + }, + "portuguese_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "portuguese_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "portuguese_stop", + "portuguese_keywords", + "portuguese_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "portuguese_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /portuguese-index/_analyze +{ + "field": "content", + "text": "Os estudantes estudam nas universidades brasileiras. Seus números são 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "estudant", + "start_offset": 3, + "end_offset": 13, + "type": "", + "position": 1 + }, + { + "token": "estudam", + "start_offset": 14, + "end_offset": 21, + "type": "", + "position": 2 + }, + { + "token": "universidad", + "start_offset": 26, + "end_offset": 39, + "type": "", + "position": 4 + }, + { + "token": "brasileir", + "start_offset": 40, + "end_offset": 51, + "type": "", + "position": 5 + }, + { + "token": "numer", + "start_offset": 58, + "end_offset": 65, + "type": "", + "position": 7 + }, + { + "token": "123456", + "start_offset": 70, + "end_offset": 76, + "type": "", + "position": 9 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/romanian.md b/_analyzers/language-analyzers/romanian.md new file mode 100644 index 0000000000..cad0953385 --- /dev/null +++ b/_analyzers/language-analyzers/romanian.md @@ -0,0 +1,172 @@ +--- +layout: default +title: Romanian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 270 +--- + +# Romanian analyzer + +The built-in `romanian` analyzer can be applied to a text field using the following command: + +```json +PUT /romanian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "romanian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_romanian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_romanian_analyzer": { + "type": "romanian", + "stem_exclusion": ["autoritate", "aprobat"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Romanian analyzer internals + +The `romanian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Romanian) + - keyword + - stemmer (Romanian) + +## Custom Romanian analyzer + +You can create a custom Romanian analyzer using the following command: + +```json +PUT /romanian-index +{ + "settings": { + "analysis": { + "filter": { + "romanian_stop": { + "type": "stop", + "stopwords": "_romanian_" + }, + "romanian_stemmer": { + "type": "stemmer", + "language": "romanian" + }, + "romanian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "romanian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "romanian_stop", + "romanian_keywords", + "romanian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "romanian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /romanian-index/_analyze +{ + "field": "content", + "text": "Studenții învață la universitățile din România. Numerele lor sunt 123456." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "studenț", + "start_offset": 0, + "end_offset": 9, + "type": "", + "position": 0 + }, + { + "token": "învaț", + "start_offset": 10, + "end_offset": 16, + "type": "", + "position": 1 + }, + { + "token": "universităț", + "start_offset": 20, + "end_offset": 34, + "type": "", + "position": 3 + }, + { + "token": "român", + "start_offset": 39, + "end_offset": 46, + "type": "", + "position": 5 + }, + { + "token": "numer", + "start_offset": 48, + "end_offset": 56, + "type": "", + "position": 6 + }, + { + "token": "123456", + "start_offset": 66, + "end_offset": 72, + "type": "", + "position": 9 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/russian.md b/_analyzers/language-analyzers/russian.md new file mode 100644 index 0000000000..bd57ba0b27 --- /dev/null +++ b/_analyzers/language-analyzers/russian.md @@ -0,0 +1,172 @@ +--- +layout: default +title: Russian +parent: Language analyzers +grand_parent: Analyzers +nav_order: 280 +--- + +# Russian analyzer + +The built-in `russian` analyzer can be applied to a text field using the following command: + +```json +PUT /russian-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "russian" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_russian_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_russian_analyzer": { + "type": "russian", + "stem_exclusion": ["авторитет", "одобрение"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Russian analyzer internals + +The `russian` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - lowercase + - stop (Russian) + - keyword + - stemmer (Russian) + +## Custom Russian analyzer + +You can create a custom Russian analyzer using the following command: + +```json +PUT /russian-index +{ + "settings": { + "analysis": { + "filter": { + "russian_stop": { + "type": "stop", + "stopwords": "_russian_" + }, + "russian_stemmer": { + "type": "stemmer", + "language": "russian" + }, + "russian_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "russian_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "russian_stop", + "russian_keywords", + "russian_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "russian_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /russian-index/_analyze +{ + "field": "content", + "text": "Студенты учатся в университетах России. Их номера 123456." 
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "студент",
+      "start_offset": 0,
+      "end_offset": 8,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "учат",
+      "start_offset": 9,
+      "end_offset": 15,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "университет",
+      "start_offset": 18,
+      "end_offset": 31,
+      "type": "<ALPHANUM>",
+      "position": 3
+    },
+    {
+      "token": "росс",
+      "start_offset": 32,
+      "end_offset": 38,
+      "type": "<ALPHANUM>",
+      "position": 4
+    },
+    {
+      "token": "номер",
+      "start_offset": 43,
+      "end_offset": 49,
+      "type": "<ALPHANUM>",
+      "position": 6
+    },
+    {
+      "token": "123456",
+      "start_offset": 50,
+      "end_offset": 56,
+      "type": "<NUM>",
+      "position": 7
+    }
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/language-analyzers/sorani.md b/_analyzers/language-analyzers/sorani.md
new file mode 100644
index 0000000000..f71d43c481
--- /dev/null
+++ b/_analyzers/language-analyzers/sorani.md
@@ -0,0 +1,168 @@
+---
+layout: default
+title: Sorani
+parent: Language analyzers
+grand_parent: Analyzers
+nav_order: 290
+---
+
+# Sorani analyzer
+
+The built-in `sorani` analyzer can be applied to a text field using the following command:
+
+```json
+PUT /sorani-index
+{
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "sorani"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Stem exclusion
+
+You can use `stem_exclusion` with this language analyzer using the following command:
+
+```json
+PUT index_with_stem_exclusion_sorani_analyzer
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "stem_exclusion_sorani_analyzer": {
+          "type": "sorani",
+          "stem_exclusion": ["مؤسسه", "اجازه"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Sorani analyzer internals
+
+The `sorani` analyzer is built using the following components:
+
+- Tokenizer: `standard`
+
+- Token filters:
+  - normalization (Sorani)
+  - lowercase
+  - decimal_digit
+  - stop (Sorani)
+  - keyword
+  - stemmer (Sorani)
+
+## Custom Sorani analyzer
+
+You can create a custom Sorani analyzer using the following command:
+
+```json
+PUT /sorani-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "sorani_stop": {
+          "type": "stop",
+          "stopwords": "_sorani_"
+        },
+        "sorani_stemmer": {
+          "type": "stemmer",
+          "language": "sorani"
+        },
+        "sorani_keywords": {
+          "type": "keyword_marker",
+          "keywords": []
+        }
+      },
+      "analyzer": {
+        "sorani_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "decimal_digit",
+            "sorani_stop",
+            "sorani_keywords",
+            "sorani_stemmer"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "sorani_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /sorani-index/_analyze
+{
+  "field": "content",
+  "text": "خوێندنی فەرمی لە هەولێرەوە. ژمارەکان ١٢٣٤٥٦."
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "خوێندن",
+      "start_offset": 0,
+      "end_offset": 7,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "فەرم",
+      "start_offset": 8,
+      "end_offset": 13,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "هەولێر",
+      "start_offset": 17,
+      "end_offset": 26,
+      "type": "<ALPHANUM>",
+      "position": 3
+    },
+    {
+      "token": "ژمار",
+      "start_offset": 28,
+      "end_offset": 36,
+      "type": "<ALPHANUM>",
+      "position": 4
+    },
+    {
+      "token": "123456",
+      "start_offset": 37,
+      "end_offset": 43,
+      "type": "<NUM>",
+      "position": 5
+    }
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/language-analyzers/spanish.md b/_analyzers/language-analyzers/spanish.md
new file mode 100644
index 0000000000..8a0d8fad3c
--- /dev/null
+++ b/_analyzers/language-analyzers/spanish.md
@@ -0,0 +1,172 @@
+---
+layout: default
+title: Spanish
+parent: Language analyzers
+grand_parent: Analyzers
+nav_order: 300
+---
+
+# Spanish analyzer
+
+The built-in `spanish` analyzer can be applied to a text field using the following command:
+
+```json
+PUT /spanish-index
+{
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "spanish"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Stem exclusion
+
+You can use `stem_exclusion` with this language analyzer using the following command:
+
+```json
+PUT index_with_stem_exclusion_spanish_analyzer
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "stem_exclusion_spanish_analyzer": {
+          "type": "spanish",
+          "stem_exclusion": ["autoridad", "aprobación"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Spanish analyzer internals
+
+The `spanish` analyzer is built using the following components:
+
+- Tokenizer: `standard`
+
+- Token filters:
+  - lowercase
+  - stop (Spanish)
+  - keyword
+  - stemmer (Spanish)
+
+## Custom Spanish analyzer
+
+You can create a custom Spanish analyzer using the following command:
+
+```json
+PUT /spanish-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "spanish_stop": {
+          "type": "stop",
+          "stopwords": "_spanish_"
+        },
+        "spanish_stemmer": {
+          "type": "stemmer",
+          "language": "light_spanish"
+        },
+        "spanish_keywords": {
+          "type": "keyword_marker",
+          "keywords": []
+        }
+      },
+      "analyzer": {
+        "spanish_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "spanish_stop",
+            "spanish_keywords",
+            "spanish_stemmer"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "spanish_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /spanish-index/_analyze
+{
+  "field": "content",
+  "text": "Los estudiantes estudian en universidades españolas. Sus números son 123456."
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "estudiant",
+      "start_offset": 4,
+      "end_offset": 15,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "estudian",
+      "start_offset": 16,
+      "end_offset": 24,
+      "type": "<ALPHANUM>",
+      "position": 2
+    },
+    {
+      "token": "universidad",
+      "start_offset": 28,
+      "end_offset": 41,
+      "type": "<ALPHANUM>",
+      "position": 4
+    },
+    {
+      "token": "español",
+      "start_offset": 42,
+      "end_offset": 51,
+      "type": "<ALPHANUM>",
+      "position": 5
+    },
+    {
+      "token": "numer",
+      "start_offset": 57,
+      "end_offset": 64,
+      "type": "<ALPHANUM>",
+      "position": 7
+    },
+    {
+      "token": "123456",
+      "start_offset": 69,
+      "end_offset": 75,
+      "type": "<NUM>",
+      "position": 9
+    }
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/language-analyzers/swedish.md b/_analyzers/language-analyzers/swedish.md
new file mode 100644
index 0000000000..9da595f12e
--- /dev/null
+++ b/_analyzers/language-analyzers/swedish.md
@@ -0,0 +1,172 @@
+---
+layout: default
+title: Swedish
+parent: Language analyzers
+grand_parent: Analyzers
+nav_order: 310
+---
+
+# Swedish analyzer
+
+The built-in `swedish` analyzer can be applied to a text field using the following command:
+
+```json
+PUT /swedish-index
+{
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "swedish"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Stem exclusion
+
+You can use `stem_exclusion` with this language analyzer using the following command:
+
+```json
+PUT index_with_stem_exclusion_swedish_analyzer
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "stem_exclusion_swedish_analyzer": {
+          "type": "swedish",
+          "stem_exclusion": ["myndighet", "godkännande"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Swedish analyzer internals
+
+The `swedish` analyzer is built using the following components:
+
+- Tokenizer: `standard`
+
+- Token filters:
+  - lowercase
+  - stop (Swedish)
+  - keyword
+  - stemmer (Swedish)
+
+## Custom Swedish analyzer
+
+You can create a custom Swedish analyzer using the following command:
+
+```json
+PUT /swedish-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "swedish_stop": {
+          "type": "stop",
+          "stopwords": "_swedish_"
+        },
+        "swedish_stemmer": {
+          "type": "stemmer",
+          "language": "swedish"
+        },
+        "swedish_keywords": {
+          "type": "keyword_marker",
+          "keywords": []
+        }
+      },
+      "analyzer": {
+        "swedish_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "swedish_stop",
+            "swedish_keywords",
+            "swedish_stemmer"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "swedish_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /swedish-index/_analyze
+{
+  "field": "content",
+  "text": "Studenter studerar vid svenska universitet. Deras nummer är 123456."
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "student",
+      "start_offset": 0,
+      "end_offset": 9,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "studer",
+      "start_offset": 10,
+      "end_offset": 18,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "svensk",
+      "start_offset": 23,
+      "end_offset": 30,
+      "type": "<ALPHANUM>",
+      "position": 3
+    },
+    {
+      "token": "universitet",
+      "start_offset": 31,
+      "end_offset": 42,
+      "type": "<ALPHANUM>",
+      "position": 4
+    },
+    {
+      "token": "numm",
+      "start_offset": 50,
+      "end_offset": 56,
+      "type": "<ALPHANUM>",
+      "position": 6
+    },
+    {
+      "token": "123456",
+      "start_offset": 60,
+      "end_offset": 66,
+      "type": "<NUM>",
+      "position": 8
+    }
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/language-analyzers/thai.md b/_analyzers/language-analyzers/thai.md
new file mode 100644
index 0000000000..e4daa1f0be
--- /dev/null
+++ b/_analyzers/language-analyzers/thai.md
@@ -0,0 +1,132 @@
+---
+layout: default
+title: Thai
+parent: Language analyzers
+grand_parent: Analyzers
+nav_order: 320
+---
+
+# Thai analyzer
+
+The built-in `thai` analyzer can be applied to a text field using the following command:
+
+```json
+PUT /thai-index
+{
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "thai"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Stem exclusion
+
+You can use `stem_exclusion` with this language analyzer using the following command:
+
+```json
+PUT index_with_stem_exclusion_thai_analyzer
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "stem_exclusion_thai_analyzer": {
+          "type": "thai",
+          "stem_exclusion": ["อำนาจ", "การอนุมัติ"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Thai analyzer internals
+
+The `thai` analyzer is built using the following components:
+
+- Tokenizer: `thai`
+
+- Token filters:
+  - lowercase
+  - decimal_digit
+  - stop (Thai)
+  - keyword
+
+## Custom Thai analyzer
+
+You can create a custom Thai analyzer using the following command:
+
+```json
+PUT /thai-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "thai_stop": {
+          "type": "stop",
+          "stopwords": "_thai_"
+        },
+        "thai_keywords": {
+          "type": "keyword_marker",
+          "keywords": []
+        }
+      },
+      "analyzer": {
+        "thai_analyzer": {
+          "tokenizer": "thai",
+          "filter": [
+            "lowercase",
+            "decimal_digit",
+            "thai_stop",
+            "thai_keywords"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "thai_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /thai-index/_analyze
+{
+  "field": "content",
+  "text": "นักเรียนกำลังศึกษาอยู่ที่มหาวิทยาลัยไทย หมายเลข 123456."
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "นักเรียน","start_offset": 0,"end_offset": 8,"type": "word","position": 0}, + {"token": "กำลัง","start_offset": 8,"end_offset": 13,"type": "word","position": 1}, + {"token": "ศึกษา","start_offset": 13,"end_offset": 18,"type": "word","position": 2}, + {"token": "มหาวิทยาลัย","start_offset": 25,"end_offset": 36,"type": "word","position": 5}, + {"token": "ไทย","start_offset": 36,"end_offset": 39,"type": "word","position": 6}, + {"token": "หมายเลข","start_offset": 40,"end_offset": 47,"type": "word","position": 7}, + {"token": "123456","start_offset": 48,"end_offset": 54,"type": "word","position": 8} + ] +} +``` \ No newline at end of file diff --git a/_analyzers/language-analyzers/turkish.md b/_analyzers/language-analyzers/turkish.md new file mode 100644 index 0000000000..fb36c5413c --- /dev/null +++ b/_analyzers/language-analyzers/turkish.md @@ -0,0 +1,143 @@ +--- +layout: default +title: Turkish +parent: Language analyzers +grand_parent: Analyzers +nav_order: 330 +--- + +# Turkish analyzer + +The built-in `turkish` analyzer can be applied to a text field using the following command: + +```json +PUT /turkish-index +{ + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "turkish" + } + } + } +} +``` +{% include copy-curl.html %} + +## Stem exclusion + +You can use `stem_exclusion` with this language analyzer using the following command: + +```json +PUT index_with_stem_exclusion_turkish_analyzer +{ + "settings": { + "analysis": { + "analyzer": { + "stem_exclusion_turkish_analyzer": { + "type": "turkish", + "stem_exclusion": ["otorite", "onay"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Turkish analyzer internals + +The `turkish` analyzer is built using the following components: + +- Tokenizer: `standard` + +- Token filters: + - apostrophe + - lowercase (Turkish) + - stop (Turkish) + - keyword + - stemmer (Turkish) + +## Custom Turkish analyzer + +You can create a custom Turkish analyzer using the following command: + +```json +PUT /turkish-index +{ + "settings": { + "analysis": { + "filter": { + "turkish_stop": { + "type": "stop", + "stopwords": "_turkish_" + }, + "turkish_stemmer": { + "type": "stemmer", + "language": "turkish" + }, + "turkish_lowercase": { + "type": "lowercase", + "language": "turkish" + }, + "turkish_keywords": { + "type": "keyword_marker", + "keywords": [] + } + }, + "analyzer": { + "turkish_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "apostrophe", + "turkish_lowercase", + "turkish_stop", + "turkish_keywords", + "turkish_stemmer" + ] + } + } + } + }, + "mappings": { + "properties": { + "content": { + "type": "text", + "analyzer": "turkish_analyzer" + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /turkish-index/_analyze +{ + "field": "content", + "text": "Öğrenciler Türk üniversitelerinde öğrenim görüyor. Numara 123456." 
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {"token": "öğrenci","start_offset": 0,"end_offset": 10,"type": "<ALPHANUM>","position": 0},
+    {"token": "türk","start_offset": 11,"end_offset": 15,"type": "<ALPHANUM>","position": 1},
+    {"token": "üniversite","start_offset": 16,"end_offset": 33,"type": "<ALPHANUM>","position": 2},
+    {"token": "öğre","start_offset": 34,"end_offset": 41,"type": "<ALPHANUM>","position": 3},
+    {"token": "görüyor","start_offset": 42,"end_offset": 49,"type": "<ALPHANUM>","position": 4},
+    {"token": "numar","start_offset": 51,"end_offset": 57,"type": "<ALPHANUM>","position": 5},
+    {"token": "123456","start_offset": 58,"end_offset": 64,"type": "<NUM>","position": 6}
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/supported-analyzers/index.md b/_analyzers/supported-analyzers/index.md
index 5616936179..43e41b8d6a 100644
--- a/_analyzers/supported-analyzers/index.md
+++ b/_analyzers/supported-analyzers/index.md
@@ -24,12 +24,12 @@ Analyzer | Analysis performed | Analyzer output
 **Stop** | - Parses strings into tokens on any non-letter character
- Removes non-letter characters
- Removes stop words
- Converts tokens to lowercase | [`s`, `fun`, `contribute`, `brand`, `new`, `pr`, `opensearch`] **Keyword** (no-op) | - Outputs the entire string unchanged | [`It’s fun to contribute a brand-new PR or 2 to OpenSearch!`] **Pattern** | - Parses strings into tokens using regular expressions
- Supports converting strings to lowercase
- Supports removing stop words | [`it`, `s`, `fun`, `to`, `contribute`, `a`,`brand`, `new`, `pr`, `or`, `2`, `to`, `opensearch`] -[**Language**]({{site.url}}{{site.baseurl}}/analyzers/language-analyzers/) | Performs analysis specific to a certain language (for example, `english`). | [`fun`, `contribut`, `brand`, `new`, `pr`, `2`, `opensearch`] +[**Language**]({{site.url}}{{site.baseurl}}/analyzers/language-analyzers/index/) | Performs analysis specific to a certain language (for example, `english`). | [`fun`, `contribut`, `brand`, `new`, `pr`, `2`, `opensearch`] **Fingerprint** | - Parses strings on any non-letter character
- Normalizes characters by converting them to ASCII
- Converts tokens to lowercase
- Sorts, deduplicates, and concatenates tokens into a single token
- Supports removing stop words | [`2 a brand contribute fun it's new opensearch or pr to`]
Note that the apostrophe was converted to its ASCII counterpart. ## Language analyzers -OpenSearch supports multiple language analyzers. For more information, see [Language analyzers]({{site.url}}{{site.baseurl}}/analyzers/language-analyzers/). +OpenSearch supports multiple language analyzers. For more information, see [Language analyzers]({{site.url}}{{site.baseurl}}/analyzers/language-analyzers/index). ## Additional analyzers diff --git a/_analyzers/token-filters/condition.md b/_analyzers/token-filters/condition.md index eb3c348728..5e87c2cbbf 100644 --- a/_analyzers/token-filters/condition.md +++ b/_analyzers/token-filters/condition.md @@ -1,6 +1,6 @@ --- layout: default -title: condition +title: Condition parent: Token filters nav_order: 70 --- diff --git a/_analyzers/token-filters/dictionary-decompounder.md b/_analyzers/token-filters/dictionary-decompounder.md new file mode 100644 index 0000000000..ced6fd6fbc --- /dev/null +++ b/_analyzers/token-filters/dictionary-decompounder.md @@ -0,0 +1,101 @@ +--- +layout: default +title: Dictionary decompounder +parent: Token filters +nav_order: 110 +--- + +# Dictionary decompounder token filter + +The `dictionary_decompounder` token filter is used to split compound words into their constituent parts based on a predefined dictionary. This filter is particularly useful for languages like German, Dutch, or Finnish, in which compound words are common, so breaking them down can improve search relevance. The `dictionary_decompounder` token filter determines whether each token (word) can be split into smaller tokens based on a list of known words. If the token can be split into known words, the filter generates the subtokens for the token. + +## Parameters + +The `dictionary_decompounder` token filter has the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`word_list` | Required unless `word_list_path` is configured | Array of strings | The dictionary of words that the filter uses to split compound words. +`word_list_path` | Required unless `word_list` is configured | String | A file path to a text file containing the dictionary words. Accepts either an absolute path or a path relative to the `config` directory. The dictionary file must be UTF-8 encoded, and each word must be listed on a separate line. +`min_word_size` | Optional | Integer | The minimum length of the entire compound word that will be considered for splitting. If a compound word is shorter than this value, it is not split. Default is `5`. +`min_subword_size` | Optional | Integer | The minimum length for any subword. If a subword is shorter than this value, it is not included in the output. Default is `2`. +`max_subword_size` | Optional | Integer | The maximum length for any subword. If a subword is longer than this value, it is not included in the output. Default is `15`. +`only_longest_match` | Optional | Boolean | If set to `true`, only the longest matching subword will be returned. Default is `false`. 
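+
+If you maintain a large dictionary, you can store it in a file and reference it with `word_list_path` instead of listing every word inline. The following is a minimal sketch of that configuration; the file path `analysis/decompound_dictionary.txt` and the index and filter names are illustrative only, and the file is assumed to be UTF-8 encoded with one word per line in the `config` directory:
+
+```json
+PUT /decompound_file_example
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "file_dictionary_decompounder": {
+          "type": "dictionary_decompounder",
+          "word_list_path": "analysis/decompound_dictionary.txt"
+        }
+      },
+      "analyzer": {
+        "my_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "file_dictionary_decompounder"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}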
+
+## Example
+
+The following example request creates a new index named `decompound_example` and configures an analyzer with the `dictionary_decompounder` filter:
+
+```json
+PUT /decompound_example
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_dictionary_decompounder": {
+          "type": "dictionary_decompounder",
+          "word_list": ["slow", "green", "turtle"]
+        }
+      },
+      "analyzer": {
+        "my_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "my_dictionary_decompounder"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /decompound_example/_analyze
+{
+  "analyzer": "my_analyzer",
+  "text": "slowgreenturtleswim"
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "slowgreenturtleswim",
+      "start_offset": 0,
+      "end_offset": 19,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "slow",
+      "start_offset": 0,
+      "end_offset": 19,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "green",
+      "start_offset": 0,
+      "end_offset": 19,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "turtle",
+      "start_offset": 0,
+      "end_offset": 19,
+      "type": "<ALPHANUM>",
+      "position": 0
+    }
+  ]
+}
+```
diff --git a/_analyzers/token-filters/edge-ngram.md b/_analyzers/token-filters/edge-ngram.md
new file mode 100644
index 0000000000..be3eaf6fab
--- /dev/null
+++ b/_analyzers/token-filters/edge-ngram.md
@@ -0,0 +1,111 @@
+---
+layout: default
+title: Edge n-gram
+parent: Token filters
+nav_order: 120
+---
+
+# Edge n-gram token filter
+
+The `edge_ngram` token filter is very similar to the `ngram` token filter, where a particular string is split into substrings of different lengths. The `edge_ngram` token filter, however, generates n-grams (substrings) only from the beginning (edge) of a token. It's particularly useful in scenarios like autocomplete or prefix matching, where you want to match the beginning of words or phrases as the user types them.
+
+## Parameters
+
+The `edge_ngram` token filter can be configured with the following parameters.
+
+Parameter | Required/Optional | Data type | Description
+:--- | :--- | :--- | :---
+`min_gram` | Optional | Integer | The minimum length of the n-grams that will be generated. Default is `1`.
+`max_gram` | Optional | Integer | The maximum length of the n-grams that will be generated. Default is `1` for the `edge_ngram` filter and `2` for custom token filters. Avoid setting this parameter to a low value. If the value is set too low, only very short n-grams will be generated and the search term will not be found. For example, if `max_gram` is set to `3` and you index the word "banana", the longest generated token will be "ban". If the user searches for "banana", no matches will be returned. You can use the `truncate` token filter as a search analyzer to mitigate this risk, as shown in the sketch following this table.
+`preserve_original` | Optional | Boolean | Includes the original token in the output. Default is `false`.
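+
+As noted in the `max_gram` description, truncating search terms to the indexed n-gram length helps avoid missed matches. The following minimal sketch pairs an `edge_ngram` index analyzer with a search analyzer whose `truncate` filter caps terms at the same `max_gram` length; the index, analyzer, filter, and field names are illustrative assumptions, not part of the example above:
+
+```json
+PUT /autocomplete_example
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_edge_ngram": {
+          "type": "edge_ngram",
+          "min_gram": 1,
+          "max_gram": 3
+        },
+        "truncate_to_max_gram": {
+          "type": "truncate",
+          "length": 3
+        }
+      },
+      "analyzer": {
+        "index_autocomplete": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "my_edge_ngram"]
+        },
+        "search_autocomplete": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "truncate_to_max_gram"]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "title": {
+        "type": "text",
+        "analyzer": "index_autocomplete",
+        "search_analyzer": "search_autocomplete"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}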
+
+## Example
+
+The following example request creates a new index named `edge_ngram_example` and configures an analyzer with the `edge_ngram` filter:
+
+```json
+PUT /edge_ngram_example
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_edge_ngram": {
+          "type": "edge_ngram",
+          "min_gram": 3,
+          "max_gram": 4
+        }
+      },
+      "analyzer": {
+        "my_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "my_edge_ngram"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /edge_ngram_example/_analyze
+{
+  "analyzer": "my_analyzer",
+  "text": "slow green turtle"
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "slo",
+      "start_offset": 0,
+      "end_offset": 4,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "slow",
+      "start_offset": 0,
+      "end_offset": 4,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "gre",
+      "start_offset": 5,
+      "end_offset": 10,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "gree",
+      "start_offset": 5,
+      "end_offset": 10,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "tur",
+      "start_offset": 11,
+      "end_offset": 17,
+      "type": "<ALPHANUM>",
+      "position": 2
+    },
+    {
+      "token": "turt",
+      "start_offset": 11,
+      "end_offset": 17,
+      "type": "<ALPHANUM>",
+      "position": 2
+    }
+  ]
+}
+```
diff --git a/_analyzers/token-filters/elision.md b/_analyzers/token-filters/elision.md
new file mode 100644
index 0000000000..abc6dba658
--- /dev/null
+++ b/_analyzers/token-filters/elision.md
@@ -0,0 +1,124 @@
+---
+layout: default
+title: Elision
+parent: Token filters
+nav_order: 130
+---
+
+# Elision token filter
+
+The `elision` token filter is used to remove elided characters from words in certain languages. Elision typically occurs in languages such as French, in which words are often contracted and combined with the following word, typically by omitting a vowel and replacing it with an apostrophe.
+
+The `elision` token filter is already preconfigured in the following [language analyzers]({{site.url}}{{site.baseurl}}/analyzers/language-analyzers/): `catalan`, `french`, `irish`, and `italian`.
+{: .note}
+
+## Parameters
+
+The custom `elision` token filter can be configured with the following parameters.
+
+Parameter | Required/Optional | Data type | Description
+:--- | :--- | :--- | :---
+`articles` | Required if `articles_path` is not configured | Array of strings | Defines which articles or short words should be removed when they appear as part of an elision.
+`articles_path` | Required if `articles` is not configured | String | Specifies the path to a custom list of articles that should be removed during the analysis process.
+`articles_case` | Optional | Boolean | Specifies whether the filter is case sensitive when matching elisions. Default is `false`.
+
+## Example
+
+The default set of French elisions is `l'`, `m'`, `t'`, `qu'`, `n'`, `s'`, `j'`, `d'`, `c'`, `jusqu'`, `quoiqu'`, `lorsqu'`, and `puisqu'`. You can update this by configuring the `french_elision` token filter.
+The following example request creates a new index named `french_texts` and configures an analyzer with a `french_elision` filter:
+
+```json
+PUT /french_texts
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "french_elision": {
+          "type": "elision",
+          "articles": [ "l", "t", "m", "d", "n", "s", "j" ]
+        }
+      },
+      "analyzer": {
+        "french_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "french_elision"]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "text": {
+        "type": "text",
+        "analyzer": "french_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /french_texts/_analyze
+{
+  "analyzer": "french_analyzer",
+  "text": "L'étudiant aime l'école et le travail."
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "étudiant",
+      "start_offset": 0,
+      "end_offset": 10,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "aime",
+      "start_offset": 11,
+      "end_offset": 15,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "école",
+      "start_offset": 16,
+      "end_offset": 23,
+      "type": "<ALPHANUM>",
+      "position": 2
+    },
+    {
+      "token": "et",
+      "start_offset": 24,
+      "end_offset": 26,
+      "type": "<ALPHANUM>",
+      "position": 3
+    },
+    {
+      "token": "le",
+      "start_offset": 27,
+      "end_offset": 29,
+      "type": "<ALPHANUM>",
+      "position": 4
+    },
+    {
+      "token": "travail",
+      "start_offset": 30,
+      "end_offset": 37,
+      "type": "<ALPHANUM>",
+      "position": 5
+    }
+  ]
+}
+```
diff --git a/_analyzers/token-filters/fingerprint.md b/_analyzers/token-filters/fingerprint.md
new file mode 100644
index 0000000000..75c6615459
--- /dev/null
+++ b/_analyzers/token-filters/fingerprint.md
@@ -0,0 +1,86 @@
+---
+layout: default
+title: Fingerprint
+parent: Token filters
+nav_order: 140
+---
+
+# Fingerprint token filter
+
+The `fingerprint` token filter is used to standardize and deduplicate text. This is particularly useful when consistency in text processing is crucial. The `fingerprint` token filter achieves this by processing text using the following steps:
+
+1. **Lowercasing**: Converts all text to lowercase.
+2. **Splitting**: Breaks the text into tokens.
+3. **Sorting**: Arranges the tokens in alphabetical order.
+4. **Removing duplicates**: Eliminates repeated tokens.
+5. **Joining tokens**: Combines the tokens into a single string, typically joined by a space or another specified separator.
+
+## Parameters
+
+The `fingerprint` token filter can be configured with the following two parameters.
+
+Parameter | Required/Optional | Data type | Description
+:--- | :--- | :--- | :---
+`max_output_size` | Optional | Integer | Limits the length of the generated fingerprint string. If the concatenated string exceeds the `max_output_size`, the filter will not produce any output, resulting in an empty token. Default is `255`.
+`separator` | Optional | String | Defines the character(s) used to join the tokens into a single string after they have been sorted and deduplicated. Default is space (`" "`).
+ +## Example + +The following example request creates a new index named `my_index` and configures an analyzer with a `fingerprint` token filter: + +```json +PUT /my_index +{ + "settings": { + "analysis": { + "filter": { + "my_fingerprint": { + "type": "fingerprint", + "max_output_size": 200, + "separator": "-" + } + }, + "analyzer": { + "my_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_fingerprint" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /my_index/_analyze +{ + "analyzer": "my_analyzer", + "text": "OpenSearch is a powerful search engine that scales easily" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "a-easily-engine-is-opensearch-powerful-scales-search-that", + "start_offset": 0, + "end_offset": 57, + "type": "fingerprint", + "position": 0 + } + ] +} +``` diff --git a/_analyzers/token-filters/flatten-graph.md b/_analyzers/token-filters/flatten-graph.md new file mode 100644 index 0000000000..8d51c57400 --- /dev/null +++ b/_analyzers/token-filters/flatten-graph.md @@ -0,0 +1,109 @@ +--- +layout: default +title: Flatten graph +parent: Token filters +nav_order: 150 +--- + +# Flatten graph token filter + +The `flatten_graph` token filter is used to handle complex token relationships that occur when multiple tokens are generated at the same position in a graph structure. Some token filters, like `synonym_graph` and `word_delimiter_graph`, generate multi-position tokens---tokens that overlap or span multiple positions. These token graphs are useful for search queries but are not directly supported during indexing. The `flatten_graph` token filter resolves multi-position tokens into a linear sequence of tokens. Flattening the graph ensures compatibility with the indexing process. + +Token graph flattening is a lossy process. Whenever possible, avoid using the `flatten_graph` filter. Instead, apply graph token filters exclusively in search analyzers, removing the need for the `flatten_graph` filter. 
+{: .important}
+
+## Example
+
+The following example request creates a new index named `test_index` and configures an analyzer with a `flatten_graph` filter:
+
+```json
+PUT /test_index
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "my_index_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "my_custom_filter",
+            "flatten_graph"
+          ]
+        }
+      },
+      "filter": {
+        "my_custom_filter": {
+          "type": "word_delimiter_graph",
+          "catenate_all": true
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /test_index/_analyze
+{
+  "analyzer": "my_index_analyzer",
+  "text": "OpenSearch helped many employers"
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "OpenSearch",
+      "start_offset": 0,
+      "end_offset": 10,
+      "type": "<ALPHANUM>",
+      "position": 0,
+      "positionLength": 2
+    },
+    {
+      "token": "Open",
+      "start_offset": 0,
+      "end_offset": 4,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "Search",
+      "start_offset": 4,
+      "end_offset": 10,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "helped",
+      "start_offset": 11,
+      "end_offset": 17,
+      "type": "<ALPHANUM>",
+      "position": 2
+    },
+    {
+      "token": "many",
+      "start_offset": 18,
+      "end_offset": 22,
+      "type": "<ALPHANUM>",
+      "position": 3
+    },
+    {
+      "token": "employers",
+      "start_offset": 23,
+      "end_offset": 32,
+      "type": "<ALPHANUM>",
+      "position": 4
+    }
+  ]
+}
+```
diff --git a/_analyzers/token-filters/hunspell.md b/_analyzers/token-filters/hunspell.md
new file mode 100644
index 0000000000..6720ba74de
--- /dev/null
+++ b/_analyzers/token-filters/hunspell.md
@@ -0,0 +1,108 @@
+---
+layout: default
+title: Hunspell
+parent: Token filters
+nav_order: 160
+---
+
+# Hunspell token filter
+
+The `hunspell` token filter is used for stemming and morphological analysis of words in a specific language. This filter applies Hunspell dictionaries, which are widely used in spell checkers. It works by breaking down words into their root forms (stemming).
+
+The Hunspell dictionary files are automatically loaded at startup from the `<OS_PATH_CONF>/hunspell/<locale>` directory. For example, the `en_GB` locale must have at least one `.aff` file and one or more `.dic` files in the `<OS_PATH_CONF>/hunspell/en_GB/` directory.
+
+You can download these files from [LibreOffice dictionaries](https://github.com/LibreOffice/dictionaries).
+
+## Parameters
+
+The `hunspell` token filter can be configured with the following parameters.
+
+Parameter | Required/Optional | Data type | Description
+:--- | :--- | :--- | :---
+`language/lang/locale` | At least one of the three is required | String | Specifies the language for the Hunspell dictionary.
+`dedup` | Optional | Boolean | Determines whether to remove multiple duplicate stemming terms for the same token. Default is `true`.
+`dictionary` | Optional | Array of strings | Configures the dictionary files to be used for the Hunspell dictionary. Default is all files in the `<OS_PATH_CONF>/hunspell/<locale>` directory.
+`longest_only` | Optional | Boolean | Specifies whether only the longest stemmed version of the token should be returned. Default is `false`.
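+
+If a locale directory contains several dictionary files, the `dictionary` parameter lets you restrict the filter to specific ones. The following is a minimal sketch of that configuration; the file names `en_GB.dic` and `custom.dic` are hypothetical and assumed to exist in the `<OS_PATH_CONF>/hunspell/en_GB/` directory:
+
+```json
+PUT /hunspell_dictionary_example
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_gb_stemmer": {
+          "type": "hunspell",
+          "locale": "en_GB",
+          "dictionary": ["en_GB.dic", "custom.dic"]
+        }
+      },
+      "analyzer": {
+        "my_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "my_gb_stemmer"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}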
+
+## Example
+
+The following example request creates a new index named `my_index` and configures an analyzer with a `hunspell` filter:
+
+```json
+PUT /my_index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_hunspell_filter": {
+          "type": "hunspell",
+          "lang": "en_GB",
+          "dedup": true,
+          "longest_only": true
+        }
+      },
+      "analyzer": {
+        "my_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "my_hunspell_filter"
+          ]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /my_index/_analyze
+{
+  "analyzer": "my_analyzer",
+  "text": "the turtle moves slowly"
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "the",
+      "start_offset": 0,
+      "end_offset": 3,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "turtle",
+      "start_offset": 4,
+      "end_offset": 10,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "move",
+      "start_offset": 11,
+      "end_offset": 16,
+      "type": "<ALPHANUM>",
+      "position": 2
+    },
+    {
+      "token": "slow",
+      "start_offset": 17,
+      "end_offset": 23,
+      "type": "<ALPHANUM>",
+      "position": 3
+    }
+  ]
+}
+```
diff --git a/_analyzers/token-filters/hyphenation-decompounder.md b/_analyzers/token-filters/hyphenation-decompounder.md
new file mode 100644
index 0000000000..6e53d4dfd5
--- /dev/null
+++ b/_analyzers/token-filters/hyphenation-decompounder.md
@@ -0,0 +1,102 @@
+---
+layout: default
+title: Hyphenation decompounder
+parent: Token filters
+nav_order: 170
+---
+
+# Hyphenation decompounder token filter
+
+The `hyphenation_decompounder` token filter is used to break down compound words into their constituent parts. This filter is particularly useful for languages like German, Dutch, and Swedish, in which compound words are common. The filter uses hyphenation patterns (typically defined in .xml files) to identify the possible locations within a compound word where it can be split into components. These components are then checked against a provided dictionary. If there is a match, those components are treated as valid tokens. For more information about hyphenation pattern files, see [FOP XML Hyphenation Patterns](https://offo.sourceforge.net/#FOP+XML+Hyphenation+Patterns).
+
+## Parameters
+
+The `hyphenation_decompounder` token filter can be configured with the following parameters.
+
+Parameter | Required/Optional | Data type | Description
+:--- | :--- | :--- | :---
+`hyphenation_patterns_path` | Required | String | The path (relative to the `config` directory or absolute) to the hyphenation patterns file, which contains the language-specific rules for word splitting. The file is typically in XML format. Sample files can be downloaded from the [OFFO SourceForge project](https://sourceforge.net/projects/offo/).
+`word_list` | Required if `word_list_path` is not set | Array of strings | A list of words used to validate the components generated by the hyphenation patterns.
+`word_list_path` | Required if `word_list` is not set | String | The path (relative to the `config` directory or absolute) to a list of subwords.
+`max_subword_size` | Optional | Integer | The maximum subword length. If the generated subword exceeds this length, it will not be added to the generated tokens. Default is `15`.
+`min_subword_size` | Optional | Integer | The minimum subword length. If the generated subword is shorter than the specified length, it will not be added to the generated tokens. Default is `2`.
+`min_word_size` | Optional | Integer | The minimum word character length. Word tokens shorter than this length are excluded from decomposition into subwords. Default is `5`.
+`only_longest_match` | Optional | Boolean | Only includes the longest subword in the generated tokens. Default is `false`.
+
+## Example
+
+The following example request creates a new index named `test_index` and configures an analyzer with a `hyphenation_decompounder` filter:
+
+```json
+PUT /test_index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_hyphenation_decompounder": {
+          "type": "hyphenation_decompounder",
+          "hyphenation_patterns_path": "analysis/hyphenation_patterns.xml",
+          "word_list": ["notebook", "note", "book"],
+          "min_subword_size": 3,
+          "min_word_size": 5,
+          "only_longest_match": false
+        }
+      },
+      "analyzer": {
+        "my_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "my_hyphenation_decompounder"
+          ]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /test_index/_analyze
+{
+  "analyzer": "my_analyzer",
+  "text": "notebook"
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "notebook",
+      "start_offset": 0,
+      "end_offset": 8,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "note",
+      "start_offset": 0,
+      "end_offset": 8,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "book",
+      "start_offset": 0,
+      "end_offset": 8,
+      "type": "<ALPHANUM>",
+      "position": 0
+    }
+  ]
+}
+```
diff --git a/_analyzers/token-filters/index.md b/_analyzers/token-filters/index.md
index 9976feed60..b06489c805 100644
--- a/_analyzers/token-filters/index.md
+++ b/_analyzers/token-filters/index.md
@@ -17,7 +17,7 @@ The following table lists all token filters that OpenSearch supports.
 Token filter | Underlying Lucene token filter| Description
 [`apostrophe`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/apostrophe/) | [ApostropheFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/tr/ApostropheFilter.html) | In each token containing an apostrophe, the `apostrophe` token filter removes the apostrophe itself and all characters following it.
 [`asciifolding`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/asciifolding/) | [ASCIIFoldingFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/ASCIIFoldingFilter.html) | Converts alphabetic, numeric, and symbolic characters.
-`cjk_bigram` | [CJKBigramFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/cjk/CJKBigramFilter.html) | Forms bigrams of Chinese, Japanese, and Korean (CJK) tokens.
+[`cjk_bigram`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/cjk-bigram/) | [CJKBigramFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/cjk/CJKBigramFilter.html) | Forms bigrams of Chinese, Japanese, and Korean (CJK) tokens.
 [`cjk_width`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/cjk-width/) | [CJKWidthFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/cjk/CJKWidthFilter.html) | Normalizes Chinese, Japanese, and Korean (CJK) tokens according to the following rules:
- Folds full-width ASCII character variants into their equivalent basic Latin characters.
- Folds half-width katakana character variants into their equivalent kana characters. [`classic`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/classic) | [ClassicFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/classic/ClassicFilter.html) | Performs optional post-processing on the tokens generated by the classic tokenizer. Removes possessives (`'s`) and removes `.` from acronyms. [`common_grams`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/common_gram/) | [CommonGramsFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/commongrams/CommonGramsFilter.html) | Generates bigrams for a list of frequently occurring terms. The output contains both single terms and bigrams. @@ -25,43 +25,43 @@ Token filter | Underlying Lucene token filter| Description [`decimal_digit`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/decimal-digit/) | [DecimalDigitFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/DecimalDigitFilter.html) | Converts all digits in the Unicode decimal number general category to basic Latin digits (0--9). [`delimited_payload`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/delimited-payload/) | [DelimitedPayloadTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/payloads/DelimitedPayloadTokenFilter.html) | Separates a token stream into tokens with corresponding payloads, based on a provided delimiter. A token consists of all characters preceding the delimiter, and a payload consists of all characters following the delimiter. For example, if the delimiter is `|`, then for the string `foo|bar`, `foo` is the token and `bar` is the payload. [`delimited_term_freq`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/delimited-term-frequency/) | [DelimitedTermFrequencyTokenFilter](https://lucene.apache.org/core/9_7_0/analysis/common/org/apache/lucene/analysis/miscellaneous/DelimitedTermFrequencyTokenFilter.html) | Separates a token stream into tokens with corresponding term frequencies, based on a provided delimiter. A token consists of all characters before the delimiter, and a term frequency is the integer after the delimiter. For example, if the delimiter is `|`, then for the string `foo|5`, `foo` is the token and `5` is the term frequency. -`dictionary_decompounder` | [DictionaryCompoundWordTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/compound/DictionaryCompoundWordTokenFilter.html) | Decomposes compound words found in many Germanic languages. -`edge_ngram` | [EdgeNGramTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ngram/EdgeNGramTokenFilter.html) | Tokenizes the given token into edge n-grams (n-grams that start at the beginning of the token) of lengths between `min_gram` and `max_gram`. Optionally, keeps the original token. -`elision` | [ElisionFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/util/ElisionFilter.html) | Removes the specified [elisions](https://en.wikipedia.org/wiki/Elision) from the beginning of tokens. For example, changes `l'avion` (the plane) to `avion` (plane). -`fingerprint` | [FingerprintFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/FingerprintFilter.html) | Sorts and deduplicates the token list and concatenates tokens into a single token. 
-`flatten_graph` | [FlattenGraphFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/FlattenGraphFilter.html) | Flattens a token graph produced by a graph token filter, such as `synonym_graph` or `word_delimiter_graph`, making the graph suitable for indexing. -`hunspell` | [HunspellStemFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/hunspell/HunspellStemFilter.html) | Uses [Hunspell](https://en.wikipedia.org/wiki/Hunspell) rules to stem tokens. Because Hunspell supports a word having multiple stems, this filter can emit multiple tokens for each consumed token. Requires you to configure one or more language-specific Hunspell dictionaries. -`hyphenation_decompounder` | [HyphenationCompoundWordTokenFilter](https://lucene.apache.org/core/9_8_0/analysis/common/org/apache/lucene/analysis/compound/HyphenationCompoundWordTokenFilter.html) | Uses XML-based hyphenation patterns to find potential subwords in compound words and checks the subwords against the specified word list. The token output contains only the subwords found in the word list. -`keep_types` | [TypeTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/TypeTokenFilter.html) | Keeps or removes tokens of a specific type. -`keep_word` | [KeepWordFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/KeepWordFilter.html) | Checks the tokens against the specified word list and keeps only those that are in the list. -`keyword_marker` | [KeywordMarkerFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/KeywordMarkerFilter.html) | Marks specified tokens as keywords, preventing them from being stemmed. -`keyword_repeat` | [KeywordRepeatFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/KeywordRepeatFilter.html) | Emits each incoming token twice: once as a keyword and once as a non-keyword. -`kstem` | [KStemFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/en/KStemFilter.html) | Provides kstem-based stemming for the English language. Combines algorithmic stemming with a built-in dictionary. -`kuromoji_completion` | [JapaneseCompletionFilter](https://lucene.apache.org/core/9_10_0/analysis/kuromoji/org/apache/lucene/analysis/ja/JapaneseCompletionFilter.html) | Adds Japanese romanized terms to the token stream (in addition to the original tokens). Usually used to support autocomplete on Japanese search terms. Note that the filter has a `mode` parameter, which should be set to `index` when used in an index analyzer and `query` when used in a search analyzer. Requires the `analysis-kuromoji` plugin. For information about installing the plugin, see [Additional plugins]({{site.url}}{{site.baseurl}}/install-and-configure/plugins/#additional-plugins). -`length` | [LengthFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/LengthFilter.html) | Removes tokens whose lengths are shorter or longer than the length range specified by `min` and `max`. -`limit` | [LimitTokenCountFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/LimitTokenCountFilter.html) | Limits the number of output tokens. A common use case is to limit the size of document field values based on token count. 
-`lowercase` | [LowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/LowerCaseFilter.html) | Converts tokens to lowercase. The default [LowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/LowerCaseFilter.html) is for the English language. You can set the `language` parameter to `greek` (uses [GreekLowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/el/GreekLowerCaseFilter.html)), `irish` (uses [IrishLowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ga/IrishLowerCaseFilter.html)), or `turkish` (uses [TurkishLowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/tr/TurkishLowerCaseFilter.html)). -`min_hash` | [MinHashFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/minhash/MinHashFilter.html) | Uses the [MinHash technique](https://en.wikipedia.org/wiki/MinHash) to estimate document similarity. Performs the following operations on a token stream sequentially:
1. Hashes each token in the stream.
2. Assigns the hashes to buckets, keeping only the smallest hashes of each bucket.
3. Outputs the smallest hash from each bucket as a token stream. -`multiplexer` | N/A | Emits multiple tokens at the same position. Runs each token through each of the specified filter lists separately and outputs the results as separate tokens. -`ngram` | [NGramTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ngram/NGramTokenFilter.html) | Tokenizes the given token into n-grams of lengths between `min_gram` and `max_gram`. -Normalization | `arabic_normalization`: [ArabicNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ar/ArabicNormalizer.html)
`german_normalization`: [GermanNormalizationFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/de/GermanNormalizationFilter.html)
`hindi_normalization`: [HindiNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/hi/HindiNormalizer.html)
`indic_normalization`: [IndicNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/in/IndicNormalizer.html)
`sorani_normalization`: [SoraniNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ckb/SoraniNormalizer.html)
`persian_normalization`: [PersianNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/fa/PersianNormalizer.html)
`scandinavian_normalization` : [ScandinavianNormalizationFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/ScandinavianNormalizationFilter.html)
`scandinavian_folding`: [ScandinavianFoldingFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/ScandinavianFoldingFilter.html)
`serbian_normalization`: [SerbianNormalizationFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/sr/SerbianNormalizationFilter.html) | Normalizes the characters of one of the listed languages. -`pattern_capture` | N/A | Generates a token for every capture group in the provided regular expression. Uses [Java regular expression syntax](https://docs.oracle.com/javase/8/docs/api/java/util/regex/Pattern.html). -`pattern_replace` | N/A | Matches a pattern in the provided regular expression and replaces matching substrings. Uses [Java regular expression syntax](https://docs.oracle.com/javase/8/docs/api/java/util/regex/Pattern.html). -`phonetic` | N/A | Uses a phonetic encoder to emit a metaphone token for each token in the token stream. Requires installing the `analysis-phonetic` plugin. -`porter_stem` | [PorterStemFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/en/PorterStemFilter.html) | Uses the [Porter stemming algorithm](https://tartarus.org/martin/PorterStemmer/) to perform algorithmic stemming for the English language. -`predicate_token_filter` | N/A | Removes tokens that don’t match the specified predicate script. Supports inline Painless scripts only. -`remove_duplicates` | [RemoveDuplicatesTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/RemoveDuplicatesTokenFilter.html) | Removes duplicate tokens that are in the same position. -`reverse` | [ReverseStringFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/reverse/ReverseStringFilter.html) | Reverses the string corresponding to each token in the token stream. For example, the token `dog` becomes `god`. -`shingle` | [ShingleFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/shingle/ShingleFilter.html) | Generates shingles of lengths between `min_shingle_size` and `max_shingle_size` for tokens in the token stream. Shingles are similar to n-grams but apply to words instead of letters. For example, two-word shingles added to the list of unigrams [`contribute`, `to`, `opensearch`] are [`contribute to`, `to opensearch`]. -`snowball` | N/A | Stems words using a [Snowball-generated stemmer](https://snowballstem.org/). You can use the `snowball` token filter with the following languages in the `language` field: `Arabic`, `Armenian`, `Basque`, `Catalan`, `Danish`, `Dutch`, `English`, `Estonian`, `Finnish`, `French`, `German`, `German2`, `Hungarian`, `Irish`, `Italian`, `Kp`, `Lithuanian`, `Lovins`, `Norwegian`, `Porter`, `Portuguese`, `Romanian`, `Russian`, `Spanish`, `Swedish`, `Turkish`. 
-`stemmer` | N/A | Provides algorithmic stemming for the following languages in the `language` field: `arabic`, `armenian`, `basque`, `bengali`, `brazilian`, `bulgarian`, `catalan`, `czech`, `danish`, `dutch`, `dutch_kp`, `english`, `light_english`, `lovins`, `minimal_english`, `porter2`, `possessive_english`, `estonian`, `finnish`, `light_finnish`, `french`, `light_french`, `minimal_french`, `galician`, `minimal_galician`, `german`, `german2`, `light_german`, `minimal_german`, `greek`, `hindi`, `hungarian`, `light_hungarian`, `indonesian`, `irish`, `italian`, `light_italian`, `latvian`, `Lithuanian`, `norwegian`, `light_norwegian`, `minimal_norwegian`, `light_nynorsk`, `minimal_nynorsk`, `portuguese`, `light_portuguese`, `minimal_portuguese`, `portuguese_rslp`, `romanian`, `russian`, `light_russian`, `sorani`, `spanish`, `light_spanish`, `swedish`, `light_swedish`, `turkish`. -`stemmer_override` | N/A | Overrides stemming algorithms by applying a custom mapping so that the provided terms are not stemmed. -`stop` | [StopFilter](https://lucene.apache.org/core/8_7_0/core/org/apache/lucene/analysis/StopFilter.html) | Removes stop words from a token stream. -`synonym` | N/A | Supplies a synonym list for the analysis process. The synonym list is provided using a configuration file. -`synonym_graph` | N/A | Supplies a synonym list, including multiword synonyms, for the analysis process. -`trim` | [TrimFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/TrimFilter.html) | Trims leading and trailing white space from each token in a stream. -`truncate` | [TruncateTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/TruncateTokenFilter.html) | Truncates tokens whose length exceeds the specified character limit. -`unique` | N/A | Ensures each token is unique by removing duplicate tokens from a stream. -`uppercase` | [UpperCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/LowerCaseFilter.html) | Converts tokens to uppercase. -`word_delimiter` | [WordDelimiterFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/WordDelimiterFilter.html) | Splits tokens at non-alphanumeric characters and performs normalization based on the specified rules. -`word_delimiter_graph` | [WordDelimiterGraphFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/WordDelimiterGraphFilter.html) | Splits tokens at non-alphanumeric characters and performs normalization based on the specified rules. Assigns multi-position tokens a `positionLength` attribute. +[`dictionary_decompounder`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/dictionary-decompounder/) | [DictionaryCompoundWordTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/compound/DictionaryCompoundWordTokenFilter.html) | Decomposes compound words found in many Germanic languages. +[`edge_ngram`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/edge-ngram/) | [EdgeNGramTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ngram/EdgeNGramTokenFilter.html) | Tokenizes the given token into edge n-grams (n-grams that start at the beginning of the token) of lengths between `min_gram` and `max_gram`. Optionally, keeps the original token. 
+[`elision`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/elision/) | [ElisionFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/util/ElisionFilter.html) | Removes the specified [elisions](https://en.wikipedia.org/wiki/Elision) from the beginning of tokens. For example, changes `l'avion` (the plane) to `avion` (plane). +[`fingerprint`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/fingerprint/) | [FingerprintFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/FingerprintFilter.html) | Sorts and deduplicates the token list and concatenates tokens into a single token. +[`flatten_graph`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/flatten-graph/) | [FlattenGraphFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/FlattenGraphFilter.html) | Flattens a token graph produced by a graph token filter, such as `synonym_graph` or `word_delimiter_graph`, making the graph suitable for indexing. +[`hunspell`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/hunspell/) | [HunspellStemFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/hunspell/HunspellStemFilter.html) | Uses [Hunspell](https://en.wikipedia.org/wiki/Hunspell) rules to stem tokens. Because Hunspell allows a word to have multiple stems, this filter can emit multiple tokens for each consumed token. Requires the configuration of one or more language-specific Hunspell dictionaries. +[`hyphenation_decompounder`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/hyphenation-decompounder/) | [HyphenationCompoundWordTokenFilter](https://lucene.apache.org/core/9_8_0/analysis/common/org/apache/lucene/analysis/compound/HyphenationCompoundWordTokenFilter.html) | Uses XML-based hyphenation patterns to find potential subwords in compound words and checks the subwords against the specified word list. The token output contains only the subwords found in the word list. +[`keep_types`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/keep-types/) | [TypeTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/TypeTokenFilter.html) | Keeps or removes tokens of a specific type. +[`keep_words`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/keep-words/) | [KeepWordFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/KeepWordFilter.html) | Checks the tokens against the specified word list and keeps only those that are in the list. +[`keyword_marker`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/keyword-marker/) | [KeywordMarkerFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/KeywordMarkerFilter.html) | Marks specified tokens as keywords, preventing them from being stemmed. +[`keyword_repeat`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/keyword-repeat/) | [KeywordRepeatFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/KeywordRepeatFilter.html) | Emits each incoming token twice: once as a keyword and once as a non-keyword. +[`kstem`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/kstem/) | [KStemFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/en/KStemFilter.html) | Provides KStem-based stemming for the English language. Combines algorithmic stemming with a built-in dictionary. 
+[`kuromoji_completion`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/kuromoji-completion/) | [JapaneseCompletionFilter](https://lucene.apache.org/core/9_10_0/analysis/kuromoji/org/apache/lucene/analysis/ja/JapaneseCompletionFilter.html) | Adds Japanese romanized terms to a token stream (in addition to the original tokens). Usually used to support autocomplete of Japanese search terms. Note that the filter has a `mode` parameter that should be set to `index` when used in an index analyzer and `query` when used in a search analyzer. Requires the `analysis-kuromoji` plugin. For information about installing the plugin, see [Additional plugins]({{site.url}}{{site.baseurl}}/install-and-configure/plugins/#additional-plugins). +[`length`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/length/) | [LengthFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/LengthFilter.html) | Removes tokens that are shorter or longer than the length range specified by `min` and `max`. +[`limit`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/limit/) | [LimitTokenCountFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/LimitTokenCountFilter.html) | Limits the number of output tokens. For example, document field value sizes can be limited based on the token count. +[`lowercase`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/lowercase/) | [LowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/LowerCaseFilter.html) | Converts tokens to lowercase. The default [LowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/LowerCaseFilter.html) processes the English language. To process other languages, set the `language` parameter to `greek` (uses [GreekLowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/el/GreekLowerCaseFilter.html)), `irish` (uses [IrishLowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ga/IrishLowerCaseFilter.html)), or `turkish` (uses [TurkishLowerCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/tr/TurkishLowerCaseFilter.html)). +[`min_hash`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/min-hash/) | [MinHashFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/minhash/MinHashFilter.html) | Uses the [MinHash technique](https://en.wikipedia.org/wiki/MinHash) to estimate document similarity. Performs the following operations on a token stream sequentially:
1. Hashes each token in the stream.
2. Assigns the hashes to buckets, keeping only the smallest hashes of each bucket.
3. Outputs the smallest hash from each bucket as a token stream. +[`multiplexer`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/multiplexer/) | N/A | Emits multiple tokens at the same position. Runs each token through each of the specified filter lists separately and outputs the results as separate tokens. +[`ngram`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/ngram/) | [NGramTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ngram/NGramTokenFilter.html) | Tokenizes the given token into n-grams of lengths between `min_gram` and `max_gram`. +[Normalization]({{site.url}}{{site.baseurl}}/analyzers/token-filters/normalization/) | `arabic_normalization`: [ArabicNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ar/ArabicNormalizer.html)
`german_normalization`: [GermanNormalizationFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/de/GermanNormalizationFilter.html)
`hindi_normalization`: [HindiNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/hi/HindiNormalizer.html)
`indic_normalization`: [IndicNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/in/IndicNormalizer.html)
`sorani_normalization`: [SoraniNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/ckb/SoraniNormalizer.html)
`persian_normalization`: [PersianNormalizer](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/fa/PersianNormalizer.html)
`scandinavian_normalization`: [ScandinavianNormalizationFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/ScandinavianNormalizationFilter.html)
`scandinavian_folding`: [ScandinavianFoldingFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/ScandinavianFoldingFilter.html)
`serbian_normalization`: [SerbianNormalizationFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/sr/SerbianNormalizationFilter.html) | Normalizes the characters of one of the listed languages. +[`pattern_capture`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/pattern-capture/) | N/A | Generates a token for every capture group in the provided regular expression. Uses [Java regular expression syntax](https://docs.oracle.com/javase/8/docs/api/java/util/regex/Pattern.html). +[`pattern_replace`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/pattern-replace/) | N/A | Matches a pattern in the provided regular expression and replaces matching substrings. Uses [Java regular expression syntax](https://docs.oracle.com/javase/8/docs/api/java/util/regex/Pattern.html). +[`phonetic`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/phonetic/) | N/A | Uses a phonetic encoder to emit a metaphone token for each token in the token stream. Requires installing the `analysis-phonetic` plugin. +[`porter_stem`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/porter-stem/) | [PorterStemFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/en/PorterStemFilter.html) | Uses the [Porter stemming algorithm](https://tartarus.org/martin/PorterStemmer/) to perform algorithmic stemming for the English language. +[`predicate_token_filter`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/predicate-token-filter/) | N/A | Removes tokens that do not match the specified predicate script. Supports only inline Painless scripts. +[`remove_duplicates`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/remove-duplicates/) | [RemoveDuplicatesTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/RemoveDuplicatesTokenFilter.html) | Removes duplicate tokens that are in the same position. +[`reverse`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/reverse/) | [ReverseStringFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/reverse/ReverseStringFilter.html) | Reverses the string corresponding to each token in the token stream. For example, the token `dog` becomes `god`. +[`shingle`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/shingle/) | [ShingleFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/shingle/ShingleFilter.html) | Generates shingles of lengths between `min_shingle_size` and `max_shingle_size` for tokens in the token stream. Shingles are similar to n-grams but are generated using words instead of letters. For example, two-word shingles added to the list of unigrams [`contribute`, `to`, `opensearch`] are [`contribute to`, `to opensearch`]. +[`snowball`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/snowball/) | N/A | Stems words using a [Snowball-generated stemmer](https://snowballstem.org/). The `snowball` token filter supports using the following languages in the `language` field: `Arabic`, `Armenian`, `Basque`, `Catalan`, `Danish`, `Dutch`, `English`, `Estonian`, `Finnish`, `French`, `German`, `German2`, `Hungarian`, `Irish`, `Italian`, `Kp`, `Lithuanian`, `Lovins`, `Norwegian`, `Porter`, `Portuguese`, `Romanian`, `Russian`, `Spanish`, `Swedish`, `Turkish`. 
+[`stemmer`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/stemmer/) | N/A | Provides algorithmic stemming for the following languages, specified in the `language` field: `arabic`, `armenian`, `basque`, `bengali`, `brazilian`, `bulgarian`, `catalan`, `czech`, `danish`, `dutch`, `dutch_kp`, `english`, `light_english`, `lovins`, `minimal_english`, `porter2`, `possessive_english`, `estonian`, `finnish`, `light_finnish`, `french`, `light_french`, `minimal_french`, `galician`, `minimal_galician`, `german`, `german2`, `light_german`, `minimal_german`, `greek`, `hindi`, `hungarian`, `light_hungarian`, `indonesian`, `irish`, `italian`, `light_italian`, `latvian`, `lithuanian`, `norwegian`, `light_norwegian`, `minimal_norwegian`, `light_nynorsk`, `minimal_nynorsk`, `portuguese`, `light_portuguese`, `minimal_portuguese`, `portuguese_rslp`, `romanian`, `russian`, `light_russian`, `sorani`, `spanish`, `light_spanish`, `swedish`, `light_swedish`, `turkish`.
+[`stemmer_override`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/stemmer-override/) | N/A | Overrides stemming algorithms by applying a custom mapping so that the provided terms are not stemmed.
+[`stop`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/stop/) | [StopFilter](https://lucene.apache.org/core/8_7_0/core/org/apache/lucene/analysis/StopFilter.html) | Removes stop words from a token stream.
+[`synonym`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/synonym/) | N/A | Supplies a synonym list for the analysis process. The synonym list is provided using a configuration file.
+[`synonym_graph`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/synonym-graph/) | N/A | Supplies a synonym list, including multiword synonyms, for the analysis process.
+[`trim`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/trim/) | [TrimFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/TrimFilter.html) | Trims leading and trailing whitespace characters from each token in a stream.
+[`truncate`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/truncate/) | [TruncateTokenFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/TruncateTokenFilter.html) | Truncates tokens whose length exceeds the specified character limit.
+[`unique`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/unique/) | N/A | Ensures that each token is unique by removing duplicate tokens from a stream.
+[`uppercase`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/uppercase/) | [UpperCaseFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/core/UpperCaseFilter.html) | Converts tokens to uppercase.
+[`word_delimiter`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/word-delimiter/) | [WordDelimiterFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/WordDelimiterFilter.html) | Splits tokens at non-alphanumeric characters and performs normalization based on the specified rules.
+[`word_delimiter_graph`]({{site.url}}{{site.baseurl}}/analyzers/token-filters/word-delimiter-graph/) | [WordDelimiterGraphFilter](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/miscellaneous/WordDelimiterGraphFilter.html) | Splits tokens at non-alphanumeric characters and performs normalization based on the specified rules. Assigns a `positionLength` attribute to multi-position tokens.
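+
+As a general pattern, any filter in the preceding table can be wired into a custom analyzer in the index settings and tested using the `_analyze` API. The following minimal sketch (the index and analyzer names are illustrative) chains the `lowercase` and `unique` filters from the table:
+
+```json
+PUT /token_filter_demo
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "demo_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "unique"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}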
diff --git a/_analyzers/token-filters/keep-types.md b/_analyzers/token-filters/keep-types.md new file mode 100644 index 0000000000..59e617f567 --- /dev/null +++ b/_analyzers/token-filters/keep-types.md @@ -0,0 +1,115 @@
+---
+layout: default
+title: Keep types
+parent: Token filters
+nav_order: 180
+---
+
+# Keep types token filter
+
+The `keep_types` token filter controls which token types are kept or discarded during text analysis. Different tokenizers produce different token types, for example, `<ALPHANUM>`, `<NUM>`, or `<EMAIL>`.
+
+The `keyword`, `simple_pattern`, and `simple_pattern_split` tokenizers do not support the `keep_types` token filter because these tokenizers do not support token type attributes.
+{: .note}
+
+## Parameters
+
+The `keep_types` token filter can be configured with the following parameters.
+
+Parameter | Required/Optional | Data type | Description
+:--- | :--- | :--- | :---
+`types` | Required | List of strings | The list of token types to be kept or discarded (determined by the `mode`).
+`mode` | Optional | String | Whether to `include` or `exclude` the token types specified in `types`. Default is `include`.
+
+
+## Example
+
+The following example request creates a new index named `test_index` and configures an analyzer with a `keep_types` filter that keeps only `<ALPHANUM>` tokens:
+
+```json
+PUT /test_index
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "custom_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": ["lowercase", "keep_types_filter"]
+        }
+      },
+      "filter": {
+        "keep_types_filter": {
+          "type": "keep_types",
+          "types": ["<ALPHANUM>"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+GET /test_index/_analyze
+{
+  "analyzer": "custom_analyzer",
+  "text": "Hello 2 world! This is an example."
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens. Note that the token `2`, whose type is `<NUM>`, has been removed:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "hello",
+      "start_offset": 0,
+      "end_offset": 5,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "world",
+      "start_offset": 8,
+      "end_offset": 13,
+      "type": "<ALPHANUM>",
+      "position": 2
+    },
+    {
+      "token": "this",
+      "start_offset": 15,
+      "end_offset": 19,
+      "type": "<ALPHANUM>",
+      "position": 3
+    },
+    {
+      "token": "is",
+      "start_offset": 20,
+      "end_offset": 22,
+      "type": "<ALPHANUM>",
+      "position": 4
+    },
+    {
+      "token": "an",
+      "start_offset": 23,
+      "end_offset": 25,
+      "type": "<ALPHANUM>",
+      "position": 5
+    },
+    {
+      "token": "example",
+      "start_offset": 26,
+      "end_offset": 33,
+      "type": "<ALPHANUM>",
+      "position": 6
+    }
+  ]
+}
+``` diff --git a/_analyzers/token-filters/keep-words.md b/_analyzers/token-filters/keep-words.md new file mode 100644 index 0000000000..4a6b199e5c --- /dev/null +++ b/_analyzers/token-filters/keep-words.md @@ -0,0 +1,92 @@
+---
+layout: default
+title: Keep words
+parent: Token filters
+nav_order: 190
+---
+
+# Keep words token filter
+
+The `keep_words` token filter keeps only the specified words during the analysis process. This filter is useful if you have a large body of text but are interested in only certain keywords or terms.
+
+## Parameters
+
+The `keep_words` token filter can be configured with the following parameters.
+
+Parameter | Required/Optional | Data type | Description
+:--- | :--- | :--- | :---
+`keep_words` | Required if `keep_words_path` is not configured | List of strings | The list of words to keep.
+`keep_words_path` | Required if `keep_words` is not configured | String | The path to the file containing the list of words to keep. +`keep_words_case` | Optional | Boolean | Whether to lowercase all words during comparison. Default is `false`. + + +## Example + +The following example request creates a new index named `my_index` and configures an analyzer with a `keep_words` filter: + +```json +PUT my_index +{ + "settings": { + "analysis": { + "analyzer": { + "custom_keep_word": { + "tokenizer": "standard", + "filter": [ "keep_words_filter" ] + } + }, + "filter": { + "keep_words_filter": { + "type": "keep", + "keep_words": ["example", "world", "opensearch"], + "keep_words_case": true + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my_index/_analyze +{ + "analyzer": "custom_keep_word", + "text": "Hello, world! This is an OpenSearch example." +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "world", + "start_offset": 7, + "end_offset": 12, + "type": "", + "position": 1 + }, + { + "token": "OpenSearch", + "start_offset": 25, + "end_offset": 35, + "type": "", + "position": 5 + }, + { + "token": "example", + "start_offset": 36, + "end_offset": 43, + "type": "", + "position": 6 + } + ] +} +``` diff --git a/_analyzers/token-filters/keyword-marker.md b/_analyzers/token-filters/keyword-marker.md new file mode 100644 index 0000000000..0ec2cb96f5 --- /dev/null +++ b/_analyzers/token-filters/keyword-marker.md @@ -0,0 +1,127 @@ +--- +layout: default +title: Keyword marker +parent: Token filters +nav_order: 200 +--- + +# Keyword marker token filter + +The `keyword_marker` token filter is used to prevent certain tokens from being altered by stemmers or other filters. The `keyword_marker` token filter does this by marking the specified tokens as `keywords`, which prevents any stemming or other processing. This ensures that specific words remain in their original form. + +## Parameters + +The `keyword_marker` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`ignore_case` | Optional | Boolean | Whether to ignore the letter case when matching keywords. Default is `false`. +`keywords` | Required if either `keywords_path` or `keywords_pattern` is not set | List of strings | The list of tokens to mark as keywords. +`keywords_path` | Required if either `keywords` or `keywords_pattern` is not set | String | The path (relative to the `config` directory or absolute) to the list of keywords. +`keywords_pattern` | Required if either `keywords` or `keywords_path` is not set | String | A [regular expression](https://docs.oracle.com/javase/8/docs/api/java/util/regex/Pattern.html) used for matching tokens to be marked as keywords. + + +## Example + +The following example request creates a new index named `my_index` and configures an analyzer with a `keyword_marker` filter. 
The filter marks the word `example` as a keyword: + +```json +PUT /my_index +{ + "settings": { + "analysis": { + "analyzer": { + "custom_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": ["lowercase", "keyword_marker_filter", "stemmer"] + } + }, + "filter": { + "keyword_marker_filter": { + "type": "keyword_marker", + "keywords": ["example"] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my_index/_analyze +{ + "analyzer": "custom_analyzer", + "text": "Favorite example" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens. Note that while the word `favorite` was stemmed, the word `example` was not stemmed because it was marked as a keyword: + +```json +{ + "tokens": [ + { + "token": "favorit", + "start_offset": 0, + "end_offset": 8, + "type": "", + "position": 0 + }, + { + "token": "example", + "start_offset": 9, + "end_offset": 16, + "type": "", + "position": 1 + } + ] +} +``` + +You can further examine the impact of the `keyword_marker` token filter by adding the following parameters to the `_analyze` query: + +```json +GET /my_index/_analyze +{ + "analyzer": "custom_analyzer", + "text": "This is an OpenSearch example demonstrating keyword marker.", + "explain": true, + "attributes": "keyword" +} +``` +{% include copy-curl.html %} + +This will produce additional details in the response similar to the following: + +```json +{ + "name": "porter_stem", + "tokens": [ + ... + { + "token": "example", + "start_offset": 22, + "end_offset": 29, + "type": "", + "position": 4, + "keyword": true + }, + { + "token": "demonstr", + "start_offset": 30, + "end_offset": 43, + "type": "", + "position": 5, + "keyword": false + }, + ... + ] +} +``` diff --git a/_analyzers/token-filters/keyword-repeat.md b/_analyzers/token-filters/keyword-repeat.md new file mode 100644 index 0000000000..5ba15a037c --- /dev/null +++ b/_analyzers/token-filters/keyword-repeat.md @@ -0,0 +1,160 @@ +--- +layout: default +title: Keyword repeat +parent: Token filters +nav_order: 210 +--- + +# Keyword repeat token filter + +The `keyword_repeat` token filter emits the keyword version of a token into a token stream. This filter is typically used when you want to retain both the original token and its modified version after further token transformations, such as stemming or synonym expansion. The duplicated tokens allow the original, unchanged version of the token to remain in the final analysis alongside the modified versions. + +The `keyword_repeat` token filter should be placed before stemming filters. Stemming is not applied to every token, thus you may have duplicate tokens in the same position after stemming. To remove duplicate tokens, use the `remove_duplicates` token filter after the stemmer. 
+{: .note}
+
+
+## Example
+
+The following example request creates a new index named `my_index` and configures an analyzer with a `keyword_repeat` filter:
+
+```json
+PUT /my_index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_kstem": {
+          "type": "kstem"
+        },
+        "my_lowercase": {
+          "type": "lowercase"
+        }
+      },
+      "analyzer": {
+        "my_custom_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "my_lowercase",
+            "keyword_repeat",
+            "my_kstem"
+          ]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /my_index/_analyze
+{
+  "analyzer": "my_custom_analyzer",
+  "text": "Stopped quickly"
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "stopped",
+      "start_offset": 0,
+      "end_offset": 7,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "stop",
+      "start_offset": 0,
+      "end_offset": 7,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "quickly",
+      "start_offset": 8,
+      "end_offset": 15,
+      "type": "<ALPHANUM>",
+      "position": 1
+    },
+    {
+      "token": "quick",
+      "start_offset": 8,
+      "end_offset": 15,
+      "type": "<ALPHANUM>",
+      "position": 1
+    }
+  ]
+}
+```
+
+You can further examine the impact of the `keyword_repeat` token filter by adding the following parameters to the `_analyze` query:
+
+```json
+POST /my_index/_analyze
+{
+  "analyzer": "my_custom_analyzer",
+  "text": "Stopped quickly",
+  "explain": true,
+  "attributes": "keyword"
+}
+```
+{% include copy-curl.html %}
+
+The response includes detailed information about the tokenizer and each token filter in the chain. Note how `keyword_repeat` duplicates each token, marking one copy as a keyword, and how `my_kstem` then stems only the non-keyword copies:
+
+```json
+{
+  "detail": {
+    "custom_analyzer": true,
+    "charfilters": [],
+    "tokenizer": {
+      "name": "standard",
+      "tokens": [
+        {"token": "Stopped","start_offset": 0,"end_offset": 7,"type": "<ALPHANUM>","position": 0},
+        {"token": "quickly","start_offset": 8,"end_offset": 15,"type": "<ALPHANUM>","position": 1}
+      ]
+    },
+    "tokenfilters": [
+      {
+        "name": "my_lowercase",
+        "tokens": [
+          {"token": "stopped","start_offset": 0,"end_offset": 7,"type": "<ALPHANUM>","position": 0},
+          {"token": "quickly","start_offset": 8,"end_offset": 15,"type": "<ALPHANUM>","position": 1}
+        ]
+      },
+      {
+        "name": "keyword_repeat",
+        "tokens": [
+          {"token": "stopped","start_offset": 0,"end_offset": 7,"type": "<ALPHANUM>","position": 0,"keyword": true},
+          {"token": "stopped","start_offset": 0,"end_offset": 7,"type": "<ALPHANUM>","position": 0,"keyword": false},
+          {"token": "quickly","start_offset": 8,"end_offset": 15,"type": "<ALPHANUM>","position": 1,"keyword": true},
+          {"token": "quickly","start_offset": 8,"end_offset": 15,"type": "<ALPHANUM>","position": 1,"keyword": false}
+        ]
+      },
+      {
+        "name": "my_kstem",
+        "tokens": [
+          {"token": "stopped","start_offset": 0,"end_offset": 7,"type": "<ALPHANUM>","position": 0,"keyword": true},
+          {"token": "stop","start_offset": 0,"end_offset": 7,"type": "<ALPHANUM>","position": 0,"keyword": false},
+          {"token": "quickly","start_offset": 8,"end_offset": 15,"type": "<ALPHANUM>","position": 1,"keyword": true},
+          {"token": "quick","start_offset": 8,"end_offset": 15,"type": "<ALPHANUM>","position": 1,"keyword": false}
+        ]
+      }
+    ]
+  }
+}
+```
\ No newline at
end of file diff --git a/_analyzers/token-filters/kstem.md b/_analyzers/token-filters/kstem.md new file mode 100644 index 0000000000..d13fd2c675 --- /dev/null +++ b/_analyzers/token-filters/kstem.md @@ -0,0 +1,92 @@
+---
+layout: default
+title: KStem
+parent: Token filters
+nav_order: 220
+---
+
+# KStem token filter
+
+The `kstem` token filter is a stemming filter used to reduce words to their root forms. The filter is a lightweight algorithmic stemmer designed for the English language that performs the following stemming operations:
+
+- Reduces plurals to their singular form.
+- Converts different verb tenses to their base form.
+- Removes common derivational endings, such as "-ing" or "-ed".
+
+The `kstem` token filter is equivalent to the `stemmer` filter configured with the `light_english` language. It provides more conservative stemming than other stemming filters, such as `porter_stem`.
+
+The `kstem` token filter is based on the Lucene KStemFilter. For more information, see the [Lucene documentation](https://lucene.apache.org/core/9_10_0/analysis/common/org/apache/lucene/analysis/en/KStemFilter.html).
+
+## Example
+
+The following example request creates a new index named `my_kstem_index` and configures an analyzer with a `kstem` filter:
+
+```json
+PUT /my_kstem_index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "kstem_filter": {
+          "type": "kstem"
+        }
+      },
+      "analyzer": {
+        "my_kstem_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "kstem_filter"
+          ]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "content": {
+        "type": "text",
+        "analyzer": "my_kstem_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+POST /my_kstem_index/_analyze
+{
+  "analyzer": "my_kstem_analyzer",
+  "text": "stops stopped"
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "stop",
+      "start_offset": 0,
+      "end_offset": 5,
+      "type": "<ALPHANUM>",
+      "position": 0
+    },
+    {
+      "token": "stop",
+      "start_offset": 6,
+      "end_offset": 13,
+      "type": "<ALPHANUM>",
+      "position": 1
+    }
+  ]
+}
+```
\ No newline at end of file
diff --git a/_analyzers/token-filters/kuromoji-completion.md b/_analyzers/token-filters/kuromoji-completion.md new file mode 100644 index 0000000000..24833e92e1 --- /dev/null +++ b/_analyzers/token-filters/kuromoji-completion.md @@ -0,0 +1,127 @@
+---
+layout: default
+title: Kuromoji completion
+parent: Token filters
+nav_order: 230
+---
+
+# Kuromoji completion token filter
+
+The `kuromoji_completion` token filter is used to stem Katakana words in Japanese, which are often used to represent foreign words or loanwords. This filter is especially useful for autocompletion or suggest queries, in which partial matches on Katakana words can be expanded to include their full forms.
+
+To use this token filter, you must first install the `analysis-kuromoji` plugin on all nodes by running `bin/opensearch-plugin install analysis-kuromoji` and then restart the cluster. For more information about installing additional plugins, see [Additional plugins]({{site.url}}{{site.baseurl}}/install-and-configure/additional-plugins/index/).
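+
+For convenience, the installation command quoted in the preceding paragraph is shown below. Run it from your OpenSearch installation directory on every node:
+
+```bash
+bin/opensearch-plugin install analysis-kuromoji
+```
+{% include copy.html %}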
+ +## Example + +The following example request creates a new index named `kuromoji_sample` and configures an analyzer with a `kuromoji_completion` filter: + +```json +PUT kuromoji_sample +{ + "settings": { + "index": { + "analysis": { + "analyzer": { + "my_analyzer": { + "tokenizer": "kuromoji_tokenizer", + "filter": [ + "my_katakana_stemmer" + ] + } + }, + "filter": { + "my_katakana_stemmer": { + "type": "kuromoji_completion" + } + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer with text that translates to "use a computer": + +```json +POST /kuromoji_sample/_analyze +{ + "analyzer": "my_analyzer", + "text": "コンピューターを使う" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "コンピューター", // The original Katakana word "computer". + "start_offset": 0, + "end_offset": 7, + "type": "word", + "position": 0 + }, + { + "token": "konpyuーtaー", // Romanized version (Romaji) of "コンピューター". + "start_offset": 0, + "end_offset": 7, + "type": "word", + "position": 0 + }, + { + "token": "konnpyuーtaー", // Another possible romanized version of "コンピューター" (with a slight variation in the spelling). + "start_offset": 0, + "end_offset": 7, + "type": "word", + "position": 0 + }, + { + "token": "を", // A Japanese particle, "wo" or "o" + "start_offset": 7, + "end_offset": 8, + "type": "word", + "position": 1 + }, + { + "token": "wo", // Romanized form of the particle "を" (often pronounced as "o"). + "start_offset": 7, + "end_offset": 8, + "type": "word", + "position": 1 + }, + { + "token": "o", // Another version of the romanization. + "start_offset": 7, + "end_offset": 8, + "type": "word", + "position": 1 + }, + { + "token": "使う", // The verb "use" in Kanji. + "start_offset": 8, + "end_offset": 10, + "type": "word", + "position": 2 + }, + { + "token": "tukau", // Romanized version of "使う" + "start_offset": 8, + "end_offset": 10, + "type": "word", + "position": 2 + }, + { + "token": "tsukau", // Another romanized version of "使う", where "tsu" is more phonetically correct + "start_offset": 8, + "end_offset": 10, + "type": "word", + "position": 2 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/token-filters/length.md b/_analyzers/token-filters/length.md new file mode 100644 index 0000000000..f6c5dcc706 --- /dev/null +++ b/_analyzers/token-filters/length.md @@ -0,0 +1,91 @@ +--- +layout: default +title: Length +parent: Token filters +nav_order: 240 +--- + +# Length token filter + +The `length` token filter is used to remove tokens that don't meet specified length criteria (minimum and maximum values) from the token stream. + +## Parameters + +The `length` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`min` | Optional | Integer | The minimum token length. Default is `0`. +`max` | Optional | Integer | The maximum token length. Default is `Integer.MAX_VALUE` (`2147483647`). 
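+
+To experiment with the filter without creating an index, you can also define it inline in an `_analyze` request. The following minimal sketch (the sample text and length values are illustrative) keeps only tokens that are at least 4 characters long:
+
+```json
+GET /_analyze
+{
+  "tokenizer": "whitespace",
+  "filter": [
+    {
+      "type": "length",
+      "min": 4
+    }
+  ],
+  "text": "a quick brown fox"
+}
+```
+{% include copy-curl.html %}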
+ + +## Example + +The following example request creates a new index named `my_index` and configures an analyzer with a `length` filter: + +```json +PUT my_index +{ + "settings": { + "analysis": { + "analyzer": { + "only_keep_4_to_10_characters": { + "tokenizer": "whitespace", + "filter": [ "length_4_to_10" ] + } + }, + "filter": { + "length_4_to_10": { + "type": "length", + "min": 4, + "max": 10 + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my_index/_analyze +{ + "analyzer": "only_keep_4_to_10_characters", + "text": "OpenSearch is a great tool!" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "OpenSearch", + "start_offset": 0, + "end_offset": 10, + "type": "word", + "position": 0 + }, + { + "token": "great", + "start_offset": 16, + "end_offset": 21, + "type": "word", + "position": 3 + }, + { + "token": "tool!", + "start_offset": 22, + "end_offset": 27, + "type": "word", + "position": 4 + } + ] +} +``` diff --git a/_analyzers/token-filters/limit.md b/_analyzers/token-filters/limit.md new file mode 100644 index 0000000000..a849f5f06b --- /dev/null +++ b/_analyzers/token-filters/limit.md @@ -0,0 +1,89 @@ +--- +layout: default +title: Limit +parent: Token filters +nav_order: 250 +--- + +# Limit token filter + +The `limit` token filter is used to limit the number of tokens passed through the analysis chain. + +## Parameters + +The `limit` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`max_token_count` | Optional | Integer | The maximum number of tokens to be generated. Default is `1`. +`consume_all_tokens` | Optional | Boolean | (Expert-level setting) Uses all tokens from the tokenizer, even if the result exceeds `max_token_count`. When this parameter is set, the output still only contains the number of tokens specified by `max_token_count`. However, all tokens generated by the tokenizer are processed. Default is `false`. + +## Example + +The following example request creates a new index named `my_index` and configures an analyzer with a `limit` filter: + +```json +PUT my_index +{ + "settings": { + "analysis": { + "analyzer": { + "three_token_limit": { + "tokenizer": "standard", + "filter": [ "custom_token_limit" ] + } + }, + "filter": { + "custom_token_limit": { + "type": "limit", + "max_token_count": 3 + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my_index/_analyze +{ + "analyzer": "three_token_limit", + "text": "OpenSearch is a powerful and flexible search engine." 
+} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "OpenSearch", + "start_offset": 0, + "end_offset": 10, + "type": "", + "position": 0 + }, + { + "token": "is", + "start_offset": 11, + "end_offset": 13, + "type": "", + "position": 1 + }, + { + "token": "a", + "start_offset": 14, + "end_offset": 15, + "type": "", + "position": 2 + } + ] +} +``` diff --git a/_analyzers/token-filters/lowercase.md b/_analyzers/token-filters/lowercase.md new file mode 100644 index 0000000000..89f0f219fa --- /dev/null +++ b/_analyzers/token-filters/lowercase.md @@ -0,0 +1,82 @@ +--- +layout: default +title: Lowercase +parent: Token filters +nav_order: 260 +--- + +# Lowercase token filter + +The `lowercase` token filter is used to convert all characters in the token stream to lowercase, making searches case insensitive. + +## Parameters + +The `lowercase` token filter can be configured with the following parameter. + +Parameter | Required/Optional | Description +:--- | :--- | :--- + `language` | Optional | Specifies a language-specific token filter. Valid values are:
- [`greek`](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/el/GreekLowerCaseFilter.html)
- [`irish`](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/ga/IrishLowerCaseFilter.html)
- [`turkish`](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/tr/TurkishLowerCaseFilter.html).
Default is the [Lucene LowerCaseFilter](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/core/LowerCaseFilter.html). + +## Example + +The following example request creates a new index named `custom_lowercase_example`. It configures an analyzer with a `lowercase` filter and specifies `greek` as the `language`: + +```json +PUT /custom_lowercase_example +{ + "settings": { + "analysis": { + "analyzer": { + "greek_lowercase_example": { + "type": "custom", + "tokenizer": "standard", + "filter": ["greek_lowercase"] + } + }, + "filter": { + "greek_lowercase": { + "type": "lowercase", + "language": "greek" + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /custom_lowercase_example/_analyze +{ + "analyzer": "greek_lowercase_example", + "text": "Αθήνα ΕΛΛΑΔΑ" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "αθηνα", + "start_offset": 0, + "end_offset": 5, + "type": "", + "position": 0 + }, + { + "token": "ελλαδα", + "start_offset": 6, + "end_offset": 12, + "type": "", + "position": 1 + } + ] +} +``` diff --git a/_analyzers/token-filters/min-hash.md b/_analyzers/token-filters/min-hash.md new file mode 100644 index 0000000000..e4f1a8da91 --- /dev/null +++ b/_analyzers/token-filters/min-hash.md @@ -0,0 +1,138 @@ +--- +layout: default +title: Min hash +parent: Token filters +nav_order: 270 +--- + +# Min hash token filter + +The `min_hash` token filter is used to generate hashes for tokens based on a [MinHash](https://en.wikipedia.org/wiki/MinHash) approximation algorithm, which is useful for detecting similarity between documents. The `min_hash` token filter generates hashes for a set of tokens (typically from an analyzed field). + +## Parameters + +The `min_hash` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`hash_count` | Optional | Integer | The number of hash values to generate for each token. Increasing this value generally improves the accuracy of similarity estimation but increases the computational cost. Default is `1`. +`bucket_count` | Optional | Integer | The number of hash buckets to use. This affects the granularity of the hashing. A larger number of buckets provides finer granularity and reduces hash collisions but requires more memory. Default is `512`. +`hash_set_size` | Optional | Integer | The number of hashes to retain in each bucket. This can influence the hashing quality. Larger set sizes may lead to better similarity detection but consume more memory. Default is `1`. +`with_rotation` | Optional | Boolean | When set to `true`, the filter populates empty buckets with the value from the first non-empty bucket found to its circular right, provided that the `hash_set_size` is `1`. If the `bucket_count` argument exceeds `1`, this setting automatically defaults to `true`; otherwise, it defaults to `false`. 
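+
+In practice, the filter is typically attached to a field mapping so that MinHash signatures are computed at index time. The following minimal sketch (the index, filter, analyzer, and field names are illustrative, and the filter uses its default parameter values) maps a `fingerprint` field to a MinHash analyzer:
+
+```json
+PUT /similarity_index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_minhash": { "type": "min_hash" }
+      },
+      "analyzer": {
+        "minhash_analyzer": {
+          "tokenizer": "standard",
+          "filter": ["my_minhash"]
+        }
+      }
+    }
+  },
+  "mappings": {
+    "properties": {
+      "fingerprint": {
+        "type": "text",
+        "analyzer": "minhash_analyzer"
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}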
+ +## Example + +The following example request creates a new index named `minhash_index` and configures an analyzer with a `min_hash` filter: + +```json +PUT /minhash_index +{ + "settings": { + "analysis": { + "filter": { + "minhash_filter": { + "type": "min_hash", + "hash_count": 3, + "bucket_count": 512, + "hash_set_size": 1, + "with_rotation": false + } + }, + "analyzer": { + "minhash_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "minhash_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /minhash_index/_analyze +{ + "analyzer": "minhash_analyzer", + "text": "OpenSearch is very powerful." +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens (the tokens are not human readable because they represent hashes): + +```json +{ + "tokens" : [ + { + "token" : "\u0000\u0000㳠锯ੲ걌䐩䉵", + "start_offset" : 0, + "end_offset" : 27, + "type" : "MIN_HASH", + "position" : 0 + }, + { + "token" : "\u0000\u0000㳠锯ੲ걌䐩䉵", + "start_offset" : 0, + "end_offset" : 27, + "type" : "MIN_HASH", + "position" : 0 + }, + ... +``` + +In order to demonstrate the usefulness of the `min_hash` token filter, you can use the following Python script to compare the two strings using the previously created analyzer: + +```python +from opensearchpy import OpenSearch +from requests.auth import HTTPBasicAuth + +# Initialize the OpenSearch client with authentication +host = 'https://localhost:9200' # Update if using a different host/port +auth = ('admin', 'admin') # Username and password + +# Create the OpenSearch client with SSL verification turned off +client = OpenSearch( + hosts=[host], + http_auth=auth, + use_ssl=True, + verify_certs=False, # Disable SSL certificate validation + ssl_show_warn=False # Suppress SSL warnings in the output +) + +# Analyzes text and returns the minhash tokens +def analyze_text(index, text): + response = client.indices.analyze( + index=index, + body={ + "analyzer": "minhash_analyzer", + "text": text + } + ) + return [token['token'] for token in response['tokens']] + +# Analyze two similar texts +tokens_1 = analyze_text('minhash_index', 'OpenSearch is a powerful search engine.') +tokens_2 = analyze_text('minhash_index', 'OpenSearch is a very powerful search engine.') + +# Calculate Jaccard similarity +set_1 = set(tokens_1) +set_2 = set(tokens_2) +shared_tokens = set_1.intersection(set_2) +jaccard_similarity = len(shared_tokens) / len(set_1.union(set_2)) + +print(f"Jaccard Similarity: {jaccard_similarity}") +``` + +The response should contain the Jaccard similarity score: + +```yaml +Jaccard Similarity: 0.8571428571428571 +``` \ No newline at end of file diff --git a/_analyzers/token-filters/multiplexer.md b/_analyzers/token-filters/multiplexer.md new file mode 100644 index 0000000000..21597b7fc1 --- /dev/null +++ b/_analyzers/token-filters/multiplexer.md @@ -0,0 +1,165 @@ +--- +layout: default +title: Multiplexer +parent: Token filters +nav_order: 280 +--- + +# Multiplexer token filter + +The `multiplexer` token filter allows you to create multiple versions of the same token by applying different filters. This is useful when you want to analyze the same token in multiple ways. For example, you may want to analyze a token using different stemming, synonyms, or n-gram filters and use all of the generated tokens together. 
This token filter works by duplicating the token stream and applying different filters to each copy. + +The `multiplexer` token filter removes duplicate tokens from the token stream. +{: .important} + +The `multiplexer` token filter does not support multiword `synonym` or `synonym_graph` token filters or `shingle` token filters because they need to analyze not only the current token but also upcoming tokens in order to determine how to transform the input correctly. +{: .important} + +## Parameters + +The `multiplexer` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`filters` | Optional | List of strings | A comma-separated list of token filters to apply to each copy of the token stream. Default is an empty list. +`preserve_original` | Optional | Boolean | Whether to keep the original token as one of the outputs. Default is `true`. + +## Example + +The following example request creates a new index named `multiplexer_index` and configures an analyzer with a `multiplexer` filter: + +```json +PUT /multiplexer_index +{ + "settings": { + "analysis": { + "filter": { + "english_stemmer": { + "type": "stemmer", + "name": "english" + }, + "synonym_filter": { + "type": "synonym", + "synonyms": [ + "quick,fast" + ] + }, + "multiplexer_filter": { + "type": "multiplexer", + "filters": ["english_stemmer", "synonym_filter"], + "preserve_original": true + } + }, + "analyzer": { + "multiplexer_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "multiplexer_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /multiplexer_index/_analyze +{ + "analyzer": "multiplexer_analyzer", + "text": "The slow turtle hides from the quick dog" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "The", + "start_offset": 0, + "end_offset": 3, + "type": "", + "position": 0 + }, + { + "token": "slow", + "start_offset": 4, + "end_offset": 8, + "type": "", + "position": 1 + }, + { + "token": "turtle", + "start_offset": 9, + "end_offset": 15, + "type": "", + "position": 2 + }, + { + "token": "turtl", + "start_offset": 9, + "end_offset": 15, + "type": "", + "position": 2 + }, + { + "token": "hides", + "start_offset": 16, + "end_offset": 21, + "type": "", + "position": 3 + }, + { + "token": "hide", + "start_offset": 16, + "end_offset": 21, + "type": "", + "position": 3 + }, + { + "token": "from", + "start_offset": 22, + "end_offset": 26, + "type": "", + "position": 4 + }, + { + "token": "the", + "start_offset": 27, + "end_offset": 30, + "type": "", + "position": 5 + }, + { + "token": "quick", + "start_offset": 31, + "end_offset": 36, + "type": "", + "position": 6 + }, + { + "token": "fast", + "start_offset": 31, + "end_offset": 36, + "type": "SYNONYM", + "position": 6 + }, + { + "token": "dog", + "start_offset": 37, + "end_offset": 40, + "type": "", + "position": 7 + } + ] +} +``` diff --git a/_analyzers/token-filters/ngram.md b/_analyzers/token-filters/ngram.md new file mode 100644 index 0000000000..c029eac26e --- /dev/null +++ b/_analyzers/token-filters/ngram.md @@ -0,0 +1,137 @@ +--- +layout: default +title: N-gram +parent: Token filters +nav_order: 290 +--- + +# N-gram token filter + +The `ngram` token filter is a powerful tool used to break down text into smaller components, known as _n-grams_, 
which can improve partial matching and fuzzy search capabilities. It works by splitting a token into smaller substrings of defined lengths. These filters are commonly used in search applications to support autocomplete, partial matches, and typo-tolerant search. For more information, see [Autocomplete functionality]({{site.url}}{{site.baseurl}}/search-plugins/searching-data/autocomplete/) and [Did-you-mean]({{site.url}}{{site.baseurl}}/search-plugins/searching-data/did-you-mean/). + +## Parameters + +The `ngram` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`min_gram` | Optional | Integer | The minimum length of the n-grams. Default is `1`. +`max_gram` | Optional | Integer | The maximum length of the n-grams. Default is `2`. +`preserve_original` | Optional | Boolean | Whether to keep the original token as one of the outputs. Default is `false`. + +## Example + +The following example request creates a new index named `ngram_example_index` and configures an analyzer with an `ngram` filter: + +```json +PUT /ngram_example_index +{ + "settings": { + "analysis": { + "filter": { + "ngram_filter": { + "type": "ngram", + "min_gram": 2, + "max_gram": 3 + } + }, + "analyzer": { + "ngram_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "ngram_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /ngram_example_index/_analyze +{ + "analyzer": "ngram_analyzer", + "text": "Search" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "se", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "sea", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "ea", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "ear", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "ar", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "arc", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "rc", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "rch", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "ch", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + } + ] +} +``` diff --git a/_analyzers/token-filters/normalization.md b/_analyzers/token-filters/normalization.md new file mode 100644 index 0000000000..1be08e65c2 --- /dev/null +++ b/_analyzers/token-filters/normalization.md @@ -0,0 +1,88 @@ +--- +layout: default +title: Normalization +parent: Token filters +nav_order: 300 +--- + +# Normalization token filter + +The `normalization` token filter is designed to adjust and simplify text in a way that reduces variations, particularly variations in special characters. It is primarily used to handle variations in writing by standardizing characters in specific languages. 
+ +The following `normalization` token filters are available: + +- [arabic_normalization](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/ar/ArabicNormalizer.html) +- [german_normalization](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/de/GermanNormalizationFilter.html) +- [hindi_normalization](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/hi/HindiNormalizer.html) +- [indic_normalization](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/in/IndicNormalizer.html) +- [sorani_normalization](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/ckb/SoraniNormalizer.html) +- [persian_normalization](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/fa/PersianNormalizer.html) +- [scandinavian_normalization](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/miscellaneous/ScandinavianNormalizationFilter.html) +- [scandinavian_folding](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/miscellaneous/ScandinavianFoldingFilter.html) +- [serbian_normalization](https://lucene.apache.org/core/8_7_0/analyzers-common/org/apache/lucene/analysis/sr/SerbianNormalizationFilter.html) + + +## Example + +The following example request creates a new index named `german_normalizer_example` and configures an analyzer with a `german_normalization` filter: + +```json +PUT /german_normalizer_example +{ + "settings": { + "analysis": { + "filter": { + "german_normalizer": { + "type": "german_normalization" + } + }, + "analyzer": { + "german_normalizer_analyzer": { + "tokenizer": "standard", + "filter": [ + "lowercase", + "german_normalizer" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /german_normalizer_example/_analyze +{ + "text": "Straße München", + "analyzer": "german_normalizer_analyzer" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "strasse", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "munchen", + "start_offset": 7, + "end_offset": 14, + "type": "", + "position": 1 + } + ] +} +``` diff --git a/_analyzers/token-filters/pattern-capture.md b/_analyzers/token-filters/pattern-capture.md new file mode 100644 index 0000000000..cff36b583d --- /dev/null +++ b/_analyzers/token-filters/pattern-capture.md @@ -0,0 +1,97 @@ +--- +layout: default +title: Pattern capture +parent: Token filters +nav_order: 310 +--- + +# Pattern capture token filter + +The `pattern_capture` token filter is a powerful filter that uses regular expressions to capture and extract parts of text according to specific patterns. This filter can be useful when you want to extract particular parts of tokens, such as email domains, hashtags, or numbers, and reuse them for further analysis or indexing. + +## Parameters + +The `pattern_capture` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`patterns` | Required | Array of strings | An array of regular expressions used to capture parts of text. +`preserve_original` | Required | Boolean| Whether to keep the original token in the output. Default is `true`. 
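+
+For instance, to extract the hashtags mentioned above, you could pair the filter with a tokenizer that keeps the `#` character attached to the word. The following is a minimal sketch (the index name, filter name, and pattern are illustrative):
+
+```json
+PUT /hashtag_index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "hashtag_capture": {
+          "type": "pattern_capture",
+          "preserve_original": true,
+          "patterns": ["#(\\w+)"]
+        }
+      },
+      "analyzer": {
+        "hashtag_analyzer": {
+          "tokenizer": "whitespace",
+          "filter": ["hashtag_capture", "lowercase"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}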
+ + +## Example + +The following example request creates a new index named `email_index` and configures an analyzer with a `pattern_capture` filter to extract the local part and domain name from an email address: + +```json +PUT /email_index +{ + "settings": { + "analysis": { + "filter": { + "email_pattern_capture": { + "type": "pattern_capture", + "preserve_original": true, + "patterns": [ + "^([^@]+)", + "@(.+)$" + ] + } + }, + "analyzer": { + "email_analyzer": { + "tokenizer": "uax_url_email", + "filter": [ + "email_pattern_capture", + "lowercase" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /email_index/_analyze +{ + "text": "john.doe@example.com", + "analyzer": "email_analyzer" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "john.doe@example.com", + "start_offset": 0, + "end_offset": 20, + "type": "", + "position": 0 + }, + { + "token": "john.doe", + "start_offset": 0, + "end_offset": 20, + "type": "", + "position": 0 + }, + { + "token": "example.com", + "start_offset": 0, + "end_offset": 20, + "type": "", + "position": 0 + } + ] +} +``` diff --git a/_analyzers/token-filters/pattern-replace.md b/_analyzers/token-filters/pattern-replace.md new file mode 100644 index 0000000000..73ef7fa7d8 --- /dev/null +++ b/_analyzers/token-filters/pattern-replace.md @@ -0,0 +1,116 @@ +--- +layout: default +title: Pattern replace +parent: Token filters +nav_order: 320 +--- + +# Pattern replace token filter + +The `pattern_replace` token filter allows you to modify tokens using regular expressions. This filter replaces patterns in tokens with the specified values, giving you flexibility in transforming or normalizing tokens before indexing them. It's particularly useful when you need to clean or standardize text during analysis. + +## Parameters + +The `pattern_replace` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`pattern` | Required | String | A regular expression pattern that matches the text that needs to be replaced. +`all` | Optional | Boolean | Whether to replace all pattern matches. If `false`, only the first match is replaced. Default is `true`. +`replacement` | Optional | String | A string with which to replace the matched pattern. Default is an empty string. 
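+
+The `all` parameter is useful when only the first occurrence of a pattern should be rewritten. The following minimal sketch (the index, filter, and analyzer names are illustrative) replaces only the first run of digits within each token:
+
+```json
+PUT /first_match_index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "first_digit_replace": {
+          "type": "pattern_replace",
+          "pattern": "\\d+",
+          "replacement": "#",
+          "all": false
+        }
+      },
+      "analyzer": {
+        "first_match_analyzer": {
+          "tokenizer": "standard",
+          "filter": ["first_digit_replace"]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}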
+ + +## Example + +The following example request creates a new index named `text_index` and configures an analyzer with a `pattern_replace` filter to replace tokens containing digits with the string `[NUM]`: + +```json +PUT /text_index +{ + "settings": { + "analysis": { + "filter": { + "number_replace_filter": { + "type": "pattern_replace", + "pattern": "\\d+", + "replacement": "[NUM]" + } + }, + "analyzer": { + "number_analyzer": { + "tokenizer": "standard", + "filter": [ + "lowercase", + "number_replace_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /text_index/_analyze +{ + "text": "Visit us at 98765 Example St.", + "analyzer": "number_analyzer" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "visit", + "start_offset": 0, + "end_offset": 5, + "type": "", + "position": 0 + }, + { + "token": "us", + "start_offset": 6, + "end_offset": 8, + "type": "", + "position": 1 + }, + { + "token": "at", + "start_offset": 9, + "end_offset": 11, + "type": "", + "position": 2 + }, + { + "token": "[NUM]", + "start_offset": 12, + "end_offset": 17, + "type": "", + "position": 3 + }, + { + "token": "example", + "start_offset": 18, + "end_offset": 25, + "type": "", + "position": 4 + }, + { + "token": "st", + "start_offset": 26, + "end_offset": 28, + "type": "", + "position": 5 + } + ] +} +``` diff --git a/_analyzers/token-filters/phonetic.md b/_analyzers/token-filters/phonetic.md new file mode 100644 index 0000000000..7fe380851f --- /dev/null +++ b/_analyzers/token-filters/phonetic.md @@ -0,0 +1,98 @@ +--- +layout: default +title: Phonetic +parent: Token filters +nav_order: 330 +--- + +# Phonetic token filter + +The `phonetic` token filter transforms tokens into their phonetic representations, enabling more flexible matching of words that sound similar but are spelled differently. This is particularly useful for searching names, brands, or other entities that users might spell differently but pronounce similarly. + +The `phonetic` token filter is not included in OpenSearch distributions by default. To use this token filter, you must first install the `analysis-phonetic` plugin as follows and then restart OpenSearch: + +```bash +./bin/opensearch-plugin install analysis-phonetic +``` +{% include copy.html %} + +For more information about installing plugins, see [Installing plugins]({{site.url}}{{site.baseurl}}/install-and-configure/plugins/). +{: .note} + +## Parameters + +The `phonetic` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`encoder` | Optional | String | Specifies the phonetic algorithm to use.

Valid values are:
- `metaphone` (default)
- `double_metaphone`
- `soundex`
- `refined_soundex`
- `caverphone1`
- `caverphone2`
- `cologne`
- `nysiis`
- `koelnerphonetik`
- `haasephonetik`
- `beider_morse`
- `daitch_mokotoff ` +`replace` | Optional | Boolean | Whether to replace the original token. If `false`, the original token is included in the output along with the phonetic encoding. Default is `true`. + + +## Example + +The following example request creates a new index named `names_index` and configures an analyzer with a `phonetic` filter: + +```json +PUT /names_index +{ + "settings": { + "analysis": { + "filter": { + "my_phonetic_filter": { + "type": "phonetic", + "encoder": "double_metaphone", + "replace": true + } + }, + "analyzer": { + "phonetic_analyzer": { + "tokenizer": "standard", + "filter": [ + "my_phonetic_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated for the names `Stephen` and `Steven` using the analyzer: + +```json +POST /names_index/_analyze +{ + "text": "Stephen", + "analyzer": "phonetic_analyzer" +} +``` +{% include copy-curl.html %} + +```json +POST /names_index/_analyze +{ + "text": "Steven", + "analyzer": "phonetic_analyzer" +} +``` +{% include copy-curl.html %} + +In both cases, the response contains the same generated token: + +```json +{ + "tokens": [ + { + "token": "STFN", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + } + ] +} +``` diff --git a/_analyzers/token-filters/porter-stem.md b/_analyzers/token-filters/porter-stem.md new file mode 100644 index 0000000000..fa2f4208a7 --- /dev/null +++ b/_analyzers/token-filters/porter-stem.md @@ -0,0 +1,83 @@ +--- +layout: default +title: Porter stem +parent: Token filters +nav_order: 340 +--- + +# Porter stem token filter + +The `porter_stem` token filter reduces words to their base (or _stem_) form and removes common suffixes from words, which helps in matching similar words by their root. For example, the word `running` is stemmed to `run`. This token filter is primarily used for the English language and provides stemming based on the [Porter stemming algorithm](https://snowballstem.org/algorithms/porter/stemmer.html). 
+ + +## Example + +The following example request creates a new index named `my_stem_index` and configures an analyzer with a `porter_stem` filter: + +```json +PUT /my_stem_index +{ + "settings": { + "analysis": { + "filter": { + "my_porter_stem": { + "type": "porter_stem" + } + }, + "analyzer": { + "porter_analyzer": { + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_porter_stem" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /my_stem_index/_analyze +{ + "text": "running runners ran", + "analyzer": "porter_analyzer" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "run", + "start_offset": 0, + "end_offset": 7, + "type": "", + "position": 0 + }, + { + "token": "runner", + "start_offset": 8, + "end_offset": 15, + "type": "", + "position": 1 + }, + { + "token": "ran", + "start_offset": 16, + "end_offset": 19, + "type": "", + "position": 2 + } + ] +} +``` diff --git a/_analyzers/token-filters/predicate-token-filter.md b/_analyzers/token-filters/predicate-token-filter.md new file mode 100644 index 0000000000..24729f0224 --- /dev/null +++ b/_analyzers/token-filters/predicate-token-filter.md @@ -0,0 +1,82 @@ +--- +layout: default +title: Predicate token filter +parent: Token filters +nav_order: 340 +--- + +# Predicate token filter + +The `predicate_token_filter` evaluates whether tokens should be kept or discarded, depending on the conditions defined in a custom script. The tokens are evaluated in the analysis predicate context. This filter supports only inline Painless scripts. + +## Parameters + +The `predicate_token_filter` has one required parameter: `script`. This parameter provides a condition that is used to evaluate whether the token should be kept. + +## Example + +The following example request creates a new index named `predicate_index` and configures an analyzer with a `predicate_token_filter`. 
The filter specifies to only output tokens if they are longer than 7 characters: + +```json +PUT /predicate_index +{ + "settings": { + "analysis": { + "filter": { + "my_predicate_filter": { + "type": "predicate_token_filter", + "script": { + "source": "token.term.length() > 7" + } + } + }, + "analyzer": { + "predicate_analyzer": { + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_predicate_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +POST /predicate_index/_analyze +{ + "text": "The OpenSearch community is growing rapidly", + "analyzer": "predicate_analyzer" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "opensearch", + "start_offset": 4, + "end_offset": 14, + "type": "", + "position": 1 + }, + { + "token": "community", + "start_offset": 15, + "end_offset": 24, + "type": "", + "position": 2 + } + ] +} +``` diff --git a/_analyzers/token-filters/remove-duplicates.md b/_analyzers/token-filters/remove-duplicates.md new file mode 100644 index 0000000000..b0a589884a --- /dev/null +++ b/_analyzers/token-filters/remove-duplicates.md @@ -0,0 +1,152 @@ +--- +layout: default +title: Remove duplicates +parent: Token filters +nav_order: 350 +--- + +# Remove duplicates token filter + +The `remove_duplicates` token filter is used to remove duplicate tokens that are generated in the same position during analysis. + +## Example + +The following example request creates an index with a `keyword_repeat` token filter. The filter adds a `keyword` version of each token in the same position as the token itself and then uses a `kstem` to create a stemmed version of the token: + +```json +PUT /example-index +{ + "settings": { + "analysis": { + "analyzer": { + "custom_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "keyword_repeat", + "kstem" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +Use the following request to analyze the string `Slower turtle`: + +```json +GET /example-index/_analyze +{ + "analyzer": "custom_analyzer", + "text": "Slower turtle" +} +``` +{% include copy-curl.html %} + +The response contains the token `turtle` twice in the same position: + +```json +{ + "tokens": [ + { + "token": "slower", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "slow", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "turtle", + "start_offset": 7, + "end_offset": 13, + "type": "", + "position": 1 + }, + { + "token": "turtle", + "start_offset": 7, + "end_offset": 13, + "type": "", + "position": 1 + } + ] +} +``` + +The duplicate token can be removed by adding a `remove_duplicates` token filter to the index settings: + +```json +PUT /index-remove-duplicate +{ + "settings": { + "analysis": { + "analyzer": { + "custom_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "keyword_repeat", + "kstem", + "remove_duplicates" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /index-remove-duplicate/_analyze +{ + "analyzer": "custom_analyzer", + "text": "Slower turtle" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "slower", 
+ "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "slow", + "start_offset": 0, + "end_offset": 6, + "type": "", + "position": 0 + }, + { + "token": "turtle", + "start_offset": 7, + "end_offset": 13, + "type": "", + "position": 1 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/token-filters/reverse.md b/_analyzers/token-filters/reverse.md new file mode 100644 index 0000000000..dc48f07e77 --- /dev/null +++ b/_analyzers/token-filters/reverse.md @@ -0,0 +1,86 @@ +--- +layout: default +title: Reverse +parent: Token filters +nav_order: 360 +--- + +# Reverse token filter + +The `reverse` token filter reverses the order of the characters in each token, making suffix information accessible at the beginning of the reversed tokens during analysis. + +This is useful for suffix-based searches: + +The `reverse` token filter is useful when you need to perform suffix-based searches, such as in the following scenarios: + +- **Suffix matching**: Searching for words based on their suffixes, such as identifying words with a specific ending (for example, `-tion` or `-ing`). +- **File extension searches**: Searching for files by their extensions, such as `.txt` or `.jpg`. +- **Custom sorting or ranking**: By reversing tokens, you can implement unique sorting or ranking logic based on suffixes. +- **Autocomplete for suffixes**: Implementing autocomplete suggestions that use suffixes rather than prefixes. + + +## Example + +The following example request creates a new index named `my-reverse-index` and configures an analyzer with a `reverse` filter: + +```json +PUT /my-reverse-index +{ + "settings": { + "analysis": { + "filter": { + "reverse_filter": { + "type": "reverse" + } + }, + "analyzer": { + "my_reverse_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "reverse_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-reverse-index/_analyze +{ + "analyzer": "my_reverse_analyzer", + "text": "hello world" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "olleh", + "start_offset": 0, + "end_offset": 5, + "type": "", + "position": 0 + }, + { + "token": "dlrow", + "start_offset": 6, + "end_offset": 11, + "type": "", + "position": 1 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/token-filters/shingle.md b/_analyzers/token-filters/shingle.md new file mode 100644 index 0000000000..ea961bf3e0 --- /dev/null +++ b/_analyzers/token-filters/shingle.md @@ -0,0 +1,120 @@ +--- +layout: default +title: Shingle +parent: Token filters +nav_order: 370 +--- + +# Shingle token filter + +The `shingle` token filter is used to generate word n-grams, or _shingles_, from input text. For example, for the string `slow green turtle`, the `shingle` filter creates the following one- and two-word shingles: `slow`, `slow green`, `green`, `green turtle`, and `turtle`. + +This token filter is often used in conjunction with other filters to enhance search accuracy by indexing phrases rather than individual tokens. For more information, see [Phrase suggester]({{site.url}}{{site.baseurl}}/search-plugins/searching-data/did-you-mean/#phrase-suggester). + +## Parameters + +The `shingle` token filter can be configured with the following parameters. 
+ +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`min_shingle_size` | Optional | Integer | The minimum number of tokens to concatenate. Default is `2`. +`max_shingle_size` | Optional | Integer | The maximum number of tokens to concatenate. Default is `2`. +`output_unigrams` | Optional | Boolean | Whether to include unigrams (individual tokens) as output. Default is `true`. +`output_unigrams_if_no_shingles` | Optional | Boolean | Whether to output unigrams if no shingles are generated. Default is `false`. +`token_separator` | Optional | String | A separator used to concatenate tokens into a shingle. Default is a space (`" "`). +`filler_token` | Optional | String | A token inserted into empty positions or gaps between tokens. Default is an underscore (`_`). + +If `output_unigrams` and `output_unigrams_if_no_shingles` are both set to `true`, `output_unigrams_if_no_shingles` is ignored. +{: .note} + +## Example + +The following example request creates a new index named `my-shingle-index` and configures an analyzer with a `shingle` filter: + +```json +PUT /my-shingle-index +{ + "settings": { + "analysis": { + "filter": { + "my_shingle_filter": { + "type": "shingle", + "min_shingle_size": 2, + "max_shingle_size": 2, + "output_unigrams": true + } + }, + "analyzer": { + "my_shingle_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_shingle_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-shingle-index/_analyze +{ + "analyzer": "my_shingle_analyzer", + "text": "slow green turtle" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "slow", + "start_offset": 0, + "end_offset": 4, + "type": "", + "position": 0 + }, + { + "token": "slow green", + "start_offset": 0, + "end_offset": 10, + "type": "shingle", + "position": 0, + "positionLength": 2 + }, + { + "token": "green", + "start_offset": 5, + "end_offset": 10, + "type": "", + "position": 1 + }, + { + "token": "green turtle", + "start_offset": 5, + "end_offset": 17, + "type": "shingle", + "position": 1, + "positionLength": 2 + }, + { + "token": "turtle", + "start_offset": 11, + "end_offset": 17, + "type": "", + "position": 2 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/token-filters/snowball.md b/_analyzers/token-filters/snowball.md new file mode 100644 index 0000000000..149486e727 --- /dev/null +++ b/_analyzers/token-filters/snowball.md @@ -0,0 +1,108 @@ +--- +layout: default +title: Snowball +parent: Token filters +nav_order: 380 +--- + +# Snowball token filter + +The `snowball` token filter is a stemming filter based on the [Snowball](https://snowballstem.org/) algorithm. It supports many languages and is more efficient and accurate than the Porter stemming algorithm. 
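+
+Note that, as shown in the list that follows, the `language` values for this filter are capitalized (for example, `English`), unlike the lowercase values used by the `stemmer` token filter. As a quick check, you can define the filter inline in the `_analyze` API; the following is a minimal sketch using only built-in components:
+
+```json
+POST /_analyze
+{
+  "tokenizer": "standard",
+  "filter": [
+    { "type": "snowball", "language": "English" }
+  ],
+  "text": "running runners"
+}
+```
+{% include copy-curl.html %}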
+ +## Parameters + +The `snowball` token filter can be configured with a `language` parameter that accepts the following values: + +- `Arabic` +- `Armenian` +- `Basque` +- `Catalan` +- `Danish` +- `Dutch` +- `English` (default) +- `Estonian` +- `Finnish` +- `French` +- `German` +- `German2` +- `Hungarian` +- `Italian` +- `Irish` +- `Kp` +- `Lithuanian` +- `Lovins` +- `Norwegian` +- `Porter` +- `Portuguese` +- `Romanian` +- `Russian` +- `Spanish` +- `Swedish` +- `Turkish` + +## Example + +The following example request creates a new index named `my-snowball-index` and configures an analyzer with a `snowball` filter: + +```json +PUT /my-snowball-index +{ + "settings": { + "analysis": { + "filter": { + "my_snowball_filter": { + "type": "snowball", + "language": "English" + } + }, + "analyzer": { + "my_snowball_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_snowball_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-snowball-index/_analyze +{ + "analyzer": "my_snowball_analyzer", + "text": "running runners" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "run", + "start_offset": 0, + "end_offset": 7, + "type": "", + "position": 0 + }, + { + "token": "runner", + "start_offset": 8, + "end_offset": 15, + "type": "", + "position": 1 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/token-filters/stemmer-override.md b/_analyzers/token-filters/stemmer-override.md new file mode 100644 index 0000000000..c06f673714 --- /dev/null +++ b/_analyzers/token-filters/stemmer-override.md @@ -0,0 +1,139 @@ +--- +layout: default +title: Stemmer override +parent: Token filters +nav_order: 400 +--- + +# Stemmer override token filter + +The `stemmer_override` token filter allows you to define custom stemming rules that override the behavior of default stemmers like Porter or Snowball. This can be useful when you want to apply specific stemming behavior to certain words that might not be modified correctly by the standard stemming algorithms. + +## Parameters + +The `stemmer_override` token filter must be configured with exactly one of the following parameters. + +Parameter | Data type | Description +:--- | :--- | :--- +`rules` | String | Defines the override rules directly in the settings. +`rules_path` | String | Specifies the path to the file containing custom rules (mappings). The path can be either an absolute path or a path relative to the config directory. 
+ +## Example + +The following example request creates a new index named `my-index` and configures an analyzer with a `stemmer_override` filter: + +```json +PUT /my-index +{ + "settings": { + "analysis": { + "filter": { + "my_stemmer_override_filter": { + "type": "stemmer_override", + "rules": [ + "running, runner => run", + "bought => buy", + "best => good" + ] + } + }, + "analyzer": { + "my_custom_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_stemmer_override_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-index/_analyze +{ + "analyzer": "my_custom_analyzer", + "text": "I am a runner and bought the best shoes" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "i", + "start_offset": 0, + "end_offset": 1, + "type": "", + "position": 0 + }, + { + "token": "am", + "start_offset": 2, + "end_offset": 4, + "type": "", + "position": 1 + }, + { + "token": "a", + "start_offset": 5, + "end_offset": 6, + "type": "", + "position": 2 + }, + { + "token": "run", + "start_offset": 7, + "end_offset": 13, + "type": "", + "position": 3 + }, + { + "token": "and", + "start_offset": 14, + "end_offset": 17, + "type": "", + "position": 4 + }, + { + "token": "buy", + "start_offset": 18, + "end_offset": 24, + "type": "", + "position": 5 + }, + { + "token": "the", + "start_offset": 25, + "end_offset": 28, + "type": "", + "position": 6 + }, + { + "token": "good", + "start_offset": 29, + "end_offset": 33, + "type": "", + "position": 7 + }, + { + "token": "shoes", + "start_offset": 34, + "end_offset": 39, + "type": "", + "position": 8 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/token-filters/stemmer.md b/_analyzers/token-filters/stemmer.md new file mode 100644 index 0000000000..dd1344fcbc --- /dev/null +++ b/_analyzers/token-filters/stemmer.md @@ -0,0 +1,118 @@ +--- +layout: default +title: Stemmer +parent: Token filters +nav_order: 390 +--- + +# Stemmer token filter + +The `stemmer` token filter reduces words to their root or base form (also known as their _stem_). 
+ +## Parameters + +The `stemmer` token filter can be configured with a `language` parameter that accepts the following values: + +- Arabic: `arabic` +- Armenian: `armenian` +- Basque: `basque` +- Bengali: `bengali` +- Brazilian Portuguese: `brazilian` +- Bulgarian: `bulgarian` +- Catalan: `catalan` +- Czech: `czech` +- Danish: `danish` +- Dutch: `dutch, dutch_kp` +- English: `english` (default), `light_english`, `lovins`, `minimal_english`, `porter2`, `possessive_english` +- Estonian: `estonian` +- Finnish: `finnish`, `light_finnish` +- French: `light_french`, `french`, `minimal_french` +- Galician: `galician`, `minimal_galician` (plural step only) +- German: `light_german`, `german`, `german2`, `minimal_german` +- Greek: `greek` +- Hindi: `hindi` +- Hungarian: `hungarian, light_hungarian` +- Indonesian: `indonesian` +- Irish: `irish` +- Italian: `light_italian, italian` +- Kurdish (Sorani): `sorani` +- Latvian: `latvian` +- Lithuanian: `lithuanian` +- Norwegian (Bokmål): `norwegian`, `light_norwegian`, `minimal_norwegian` +- Norwegian (Nynorsk): `light_nynorsk`, `minimal_nynorsk` +- Portuguese: `light_portuguese`, `minimal_portuguese`, `portuguese`, `portuguese_rslp` +- Romanian: `romanian` +- Russian: `russian`, `light_russian` +- Spanish: `light_spanish`, `spanish` +- Swedish: `swedish`, `light_swedish` +- Turkish: `turkish` + +You can also use the `name` parameter as an alias for the `language` parameter. If both are set, the `name` parameter is ignored. +{: .note} + +## Example + +The following example request creates a new index named `my-stemmer-index` and configures an analyzer with a `stemmer` filter: + +```json +PUT /my-stemmer-index +{ + "settings": { + "analysis": { + "filter": { + "my_english_stemmer": { + "type": "stemmer", + "language": "english" + } + }, + "analyzer": { + "my_stemmer_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_english_stemmer" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-stemmer-index/_analyze +{ + "analyzer": "my_stemmer_analyzer", + "text": "running runs" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "run", + "start_offset": 0, + "end_offset": 7, + "type": "", + "position": 0 + }, + { + "token": "run", + "start_offset": 8, + "end_offset": 12, + "type": "", + "position": 1 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/token-filters/stop.md b/_analyzers/token-filters/stop.md new file mode 100644 index 0000000000..8f3e01b72d --- /dev/null +++ b/_analyzers/token-filters/stop.md @@ -0,0 +1,111 @@ +--- +layout: default +title: Stop +parent: Token filters +nav_order: 410 +--- + +# Stop token filter + +The `stop` token filter is used to remove common words (also known as _stopwords_) from a token stream during analysis. Stopwords are typically articles and prepositions, such as `a` or `for`. These words are not significantly meaningful in search queries and are often excluded to improve search efficiency and relevance. + +The default list of English stopwords includes the following words: `a`, `an`, `and`, `are`, `as`, `at`, `be`, `but`, `by`, `for`, `if`, `in`, `into`, `is`, `it`, `no`, `not`, `of`, `on`, `or`, `such`, `that`, `the`, `their`, `then`, `there`, `these`, `they`, `this`, `to`, `was`, `will`, and `with`. 
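+
+Instead of a predefined language list, you can also supply your own array of stopwords. For a quick test without creating an index, the filter can be defined inline in the `_analyze` API, as in the following minimal sketch (the stopword choices here are arbitrary); it should return only the tokens `quick` and `dog`:
+
+```json
+POST /_analyze
+{
+  "tokenizer": "standard",
+  "filter": [
+    "lowercase",
+    { "type": "stop", "stopwords": [ "the", "jumps" ] }
+  ],
+  "text": "The quick dog jumps"
+}
+```
+{% include copy-curl.html %}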
+ +## Parameters + +The `stop` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`stopwords` | Optional | String | Specifies either a custom array of stopwords or a language for which to fetch the predefined Lucene stopword list:

- [`_arabic_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/ar/stopwords.txt)
- [`_armenian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/hy/stopwords.txt)
- [`_basque_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/eu/stopwords.txt)
- [`_bengali_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/bn/stopwords.txt)
- [`_brazilian_` (Brazilian Portuguese)](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/br/stopwords.txt)
- [`_bulgarian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/bg/stopwords.txt)
- [`_catalan_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/ca/stopwords.txt)
- [`_cjk_` (Chinese, Japanese, and Korean)](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/cjk/stopwords.txt)
- [`_czech_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/cz/stopwords.txt)
- [`_danish_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/danish_stop.txt)
- [`_dutch_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/dutch_stop.txt)
- [`_english_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/java/org/apache/lucene/analysis/en/EnglishAnalyzer.java#L48) (default)
- [`_estonian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/et/stopwords.txt)
- [`_finnish_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/finnish_stop.txt)
- [`_french_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/french_stop.txt)
- [`_galician_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/gl/stopwords.txt)
- [`_german_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/german_stop.txt)
- [`_greek_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/el/stopwords.txt)
- [`_hindi_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/hi/stopwords.txt)
- [`_hungarian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/hungarian_stop.txt)
- [`_indonesian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/id/stopwords.txt)
- [`_irish_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/ga/stopwords.txt)
- [`_italian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/italian_stop.txt)
- [`_latvian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/lv/stopwords.txt)
- [`_lithuanian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/lt/stopwords.txt)
- [`_norwegian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/norwegian_stop.txt)
- [`_persian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/fa/stopwords.txt)
- [`_portuguese_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/portuguese_stop.txt)
- [`_romanian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/ro/stopwords.txt)
- [`_russian_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/russian_stop.txt)
- [`_sorani_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/ckb/stopwords.txt)
- [`_spanish_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/spanish_stop.txt)
- [`_swedish_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/snowball/swedish_stop.txt)
- [`_thai_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/th/stopwords.txt)
- [`_turkish_`](https://github.com/apache/lucene/blob/main/lucene/analysis/common/src/resources/org/apache/lucene/analysis/tr/stopwords.txt) +`stopwords_path` | Optional | String | Specifies the file path (absolute or relative to the config directory) of the file containing custom stopwords. +`ignore_case` | Optional | Boolean | If `true`, stopwords will be matched regardless of their case. Default is `false`. +`remove_trailing` | Optional | Boolean | If `true`, trailing stopwords will be removed during analysis. Default is `true`. + +## Example + +The following example request creates a new index named `my-stopword-index` and configures an analyzer with a `stop` filter that uses the predefined stopword list for the English language: + +```json +PUT /my-stopword-index +{ + "settings": { + "analysis": { + "filter": { + "my_stop_filter": { + "type": "stop", + "stopwords": "_english_" + } + }, + "analyzer": { + "my_stop_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_stop_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-stopword-index/_analyze +{ + "analyzer": "my_stop_analyzer", + "text": "A quick dog jumps over the turtle" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "quick", + "start_offset": 2, + "end_offset": 7, + "type": "", + "position": 1 + }, + { + "token": "dog", + "start_offset": 8, + "end_offset": 11, + "type": "", + "position": 2 + }, + { + "token": "jumps", + "start_offset": 12, + "end_offset": 17, + "type": "", + "position": 3 + }, + { + "token": "over", + "start_offset": 18, + "end_offset": 22, + "type": "", + "position": 4 + }, + { + "token": "turtle", + "start_offset": 27, + "end_offset": 33, + "type": "", + "position": 6 + } + ] +} +``` \ No newline at end of file diff --git a/_analyzers/token-filters/synonym-graph.md b/_analyzers/token-filters/synonym-graph.md new file mode 100644 index 0000000000..75c7c79151 --- /dev/null +++ b/_analyzers/token-filters/synonym-graph.md @@ -0,0 +1,180 @@ +--- +layout: default +title: Synonym graph +parent: Token filters +nav_order: 420 +--- + +# Synonym graph token filter + +The `synonym_graph` token filter is a more advanced version of the `synonym` token filter. It supports multiword synonyms and processes synonyms across multiple tokens, making it ideal for phrases or scenarios in which relationships between tokens are important. + +## Parameters + +The `synonym_graph` token filter can be configured with the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`synonyms` | Either `synonyms` or `synonyms_path` must be specified | String | A list of synonym rules defined directly in the configuration. +`synonyms_path` | Either `synonyms` or `synonyms_path` must be specified | String | The file path to a file containing synonym rules (either an absolute path or a path relative to the config directory). +`lenient` | Optional | Boolean | Whether to ignore exceptions when loading the rule configurations. Default is `false`. +`format` | Optional | String | Specifies the format used to determine how OpenSearch defines and interprets synonyms. Valid values are:
- `solr`
- [`wordnet`](https://wordnet.princeton.edu/).
Default is `solr`. +`expand` | Optional | Boolean | Whether to expand equivalent synonym rules. Default is `false`.

For example, if `synonyms` is defined as `"quick, fast"` and `expand` is set to `true`, then the synonym rules are configured as follows:
- `quick => quick`
- `quick => fast`
- `fast => quick`
- `fast => fast`

If `expand` is set to `false`, the synonym rules are configured as follows:
- `quick => quick`
- `fast => quick`
+
+## Example: Solr format
+
+The following example request creates a new index named `my-index` and configures an analyzer with a `synonym_graph` filter. The filter is configured with the default `solr` rule format:
+
+```json
+PUT /my-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_synonym_graph_filter": {
+          "type": "synonym_graph",
+          "synonyms": [
+            "sports car, race car",
+            "fast car, speedy vehicle",
+            "luxury car, premium vehicle",
+            "electric car, EV"
+          ]
+        }
+      },
+      "analyzer": {
+        "my_synonym_graph_analyzer": {
+          "type": "custom",
+          "tokenizer": "standard",
+          "filter": [
+            "lowercase",
+            "my_synonym_graph_filter"
+          ]
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+GET /my-index/_analyze
+{
+  "analyzer": "my_synonym_graph_analyzer",
+  "text": "I just bought a sports car and it is a fast car."
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {"token": "i","start_offset": 0,"end_offset": 1,"type": "<ALPHANUM>","position": 0},
+    {"token": "just","start_offset": 2,"end_offset": 6,"type": "<ALPHANUM>","position": 1},
+    {"token": "bought","start_offset": 7,"end_offset": 13,"type": "<ALPHANUM>","position": 2},
+    {"token": "a","start_offset": 14,"end_offset": 15,"type": "<ALPHANUM>","position": 3},
+    {"token": "race","start_offset": 16,"end_offset": 26,"type": "SYNONYM","position": 4},
+    {"token": "sports","start_offset": 16,"end_offset": 22,"type": "<ALPHANUM>","position": 4,"positionLength": 2},
+    {"token": "car","start_offset": 16,"end_offset": 26,"type": "SYNONYM","position": 5,"positionLength": 2},
+    {"token": "car","start_offset": 23,"end_offset": 26,"type": "<ALPHANUM>","position": 6},
+    {"token": "and","start_offset": 27,"end_offset": 30,"type": "<ALPHANUM>","position": 7},
+    {"token": "it","start_offset": 31,"end_offset": 33,"type": "<ALPHANUM>","position": 8},
+    {"token": "is","start_offset": 34,"end_offset": 36,"type": "<ALPHANUM>","position": 9},
+    {"token": "a","start_offset": 37,"end_offset": 38,"type": "<ALPHANUM>","position": 10},
+    {"token": "speedy","start_offset": 39,"end_offset": 47,"type": "SYNONYM","position": 11},
+    {"token": "fast","start_offset": 39,"end_offset": 43,"type": "<ALPHANUM>","position": 11,"positionLength": 2},
+    {"token": "vehicle","start_offset": 39,"end_offset": 47,"type": "SYNONYM","position": 12,"positionLength": 2},
+    {"token": "car","start_offset": 44,"end_offset": 47,"type": "<ALPHANUM>","position": 13}
+  ]
+}
+```
+
+## Example: WordNet format
+
+The following example request creates a new index named `my-wordnet-index` and configures an analyzer with a `synonym_graph` filter. The filter is configured with the [`wordnet`](https://wordnet.princeton.edu/) rule format:
+
+```json
+PUT /my-wordnet-index
+{
+  "settings": {
+    "analysis": {
+      "filter": {
+        "my_synonym_graph_filter": {
+          "type": "synonym_graph",
+          "format": "wordnet",
+          "synonyms": [
+            "s(100000001, 1, 'sports car', n, 1, 0).",
+            "s(100000001, 2, 'race car', n, 1, 0).",
+            "s(100000001, 3, 'fast car', n, 1, 0).",
+            "s(100000001, 4, 'speedy vehicle', n, 1, 0)."
+ ] + } + }, + "analyzer": { + "my_synonym_graph_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_synonym_graph_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-wordnet-index/_analyze +{ + "analyzer": "my_synonym_graph_analyzer", + "text": "I just bought a sports car and it is a fast car." +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + {"token": "i","start_offset": 0,"end_offset": 1,"type": "","position": 0}, + {"token": "just","start_offset": 2,"end_offset": 6,"type": "","position": 1}, + {"token": "bought","start_offset": 7,"end_offset": 13,"type": "","position": 2}, + {"token": "a","start_offset": 14,"end_offset": 15,"type": "","position": 3}, + {"token": "race","start_offset": 16,"end_offset": 26,"type": "SYNONYM","position": 4}, + {"token": "fast","start_offset": 16,"end_offset": 26,"type": "SYNONYM","position": 4,"positionLength": 2}, + {"token": "speedy","start_offset": 16,"end_offset": 26,"type": "SYNONYM","position": 4,"positionLength": 3}, + {"token": "sports","start_offset": 16,"end_offset": 22,"type": "","position": 4,"positionLength": 4}, + {"token": "car","start_offset": 16,"end_offset": 26,"type": "SYNONYM","position": 5,"positionLength": 4}, + {"token": "car","start_offset": 16,"end_offset": 26,"type": "SYNONYM","position": 6,"positionLength": 3}, + {"token": "vehicle","start_offset": 16,"end_offset": 26,"type": "SYNONYM","position": 7,"positionLength": 2}, + {"token": "car","start_offset": 23,"end_offset": 26,"type": "","position": 8}, + {"token": "and","start_offset": 27,"end_offset": 30,"type": "","position": 9}, + {"token": "it","start_offset": 31,"end_offset": 33,"type": "","position": 10}, + {"token": "is","start_offset": 34,"end_offset": 36,"type": "","position": 11}, + {"token": "a","start_offset": 37,"end_offset": 38,"type": "","position": 12}, + {"token": "sports","start_offset": 39,"end_offset": 47,"type": "SYNONYM","position": 13}, + {"token": "race","start_offset": 39,"end_offset": 47,"type": "SYNONYM","position": 13,"positionLength": 2}, + {"token": "speedy","start_offset": 39,"end_offset": 47,"type": "SYNONYM","position": 13,"positionLength": 3}, + {"token": "fast","start_offset": 39,"end_offset": 43,"type": "","position": 13,"positionLength": 4}, + {"token": "car","start_offset": 39,"end_offset": 47,"type": "SYNONYM","position": 14,"positionLength": 4}, + {"token": "car","start_offset": 39,"end_offset": 47,"type": "SYNONYM","position": 15,"positionLength": 3}, + {"token": "vehicle","start_offset": 39,"end_offset": 47,"type": "SYNONYM","position": 16,"positionLength": 2}, + {"token": "car","start_offset": 44,"end_offset": 47,"type": "","position": 17} + ] +} +``` diff --git a/_analyzers/token-filters/synonym.md b/_analyzers/token-filters/synonym.md new file mode 100644 index 0000000000..296d5cd5db --- /dev/null +++ b/_analyzers/token-filters/synonym.md @@ -0,0 +1,277 @@ +--- +layout: default +title: Synonym +parent: Token filters +nav_order: 415 +--- + +# Synonym token filter + +The `synonym` token filter allows you to map multiple terms to a single term or create equivalence groups between words, improving search flexibility. + +## Parameters + +The `synonym` token filter can be configured with the following parameters. 
+ +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`synonyms` | Either `synonyms` or `synonyms_path` must be specified | String | A list of synonym rules defined directly in the configuration. +`synonyms_path` | Either `synonyms` or `synonyms_path` must be specified | String | The file path to a file containing synonym rules (either an absolute path or a path relative to the config directory). +`lenient` | Optional | Boolean | Whether to ignore exceptions when loading the rule configurations. Default is `false`. +`format` | Optional | String | Specifies the format used to determine how OpenSearch defines and interprets synonyms. Valid values are:
- `solr`
- [`wordnet`](https://wordnet.princeton.edu/).
Default is `solr`. +`expand` | Optional | Boolean | Whether to expand equivalent synonym rules. Default is `false`.

For example, if `synonyms` is defined as `"quick, fast"` and `expand` is set to `true`, then the synonym rules are configured as follows:
- `quick => quick`
- `quick => fast`
- `fast => quick`
- `fast => fast`

If `expand` is set to `false`, the synonym rules are configured as follows:
- `quick => quick`
- `fast => quick` + +## Example: Solr format + +The following example request creates a new index named `my-synonym-index` and configures an analyzer with a `synonym` filter. The filter is configured with the default `solr` rule format: + +```json +PUT /my-synonym-index +{ + "settings": { + "analysis": { + "filter": { + "my_synonym_filter": { + "type": "synonym", + "synonyms": [ + "car, automobile", + "quick, fast, speedy", + "laptop => computer" + ] + } + }, + "analyzer": { + "my_synonym_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_synonym_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-synonym-index/_analyze +{ + "analyzer": "my_synonym_analyzer", + "text": "The quick dog jumps into the car with a laptop" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "the", + "start_offset": 0, + "end_offset": 3, + "type": "", + "position": 0 + }, + { + "token": "quick", + "start_offset": 4, + "end_offset": 9, + "type": "", + "position": 1 + }, + { + "token": "fast", + "start_offset": 4, + "end_offset": 9, + "type": "SYNONYM", + "position": 1 + }, + { + "token": "speedy", + "start_offset": 4, + "end_offset": 9, + "type": "SYNONYM", + "position": 1 + }, + { + "token": "dog", + "start_offset": 10, + "end_offset": 13, + "type": "", + "position": 2 + }, + { + "token": "jumps", + "start_offset": 14, + "end_offset": 19, + "type": "", + "position": 3 + }, + { + "token": "into", + "start_offset": 20, + "end_offset": 24, + "type": "", + "position": 4 + }, + { + "token": "the", + "start_offset": 25, + "end_offset": 28, + "type": "", + "position": 5 + }, + { + "token": "car", + "start_offset": 29, + "end_offset": 32, + "type": "", + "position": 6 + }, + { + "token": "automobile", + "start_offset": 29, + "end_offset": 32, + "type": "SYNONYM", + "position": 6 + }, + { + "token": "with", + "start_offset": 33, + "end_offset": 37, + "type": "", + "position": 7 + }, + { + "token": "a", + "start_offset": 38, + "end_offset": 39, + "type": "", + "position": 8 + }, + { + "token": "computer", + "start_offset": 40, + "end_offset": 46, + "type": "SYNONYM", + "position": 9 + } + ] +} +``` + +## Example: WordNet format + +The following example request creates a new index named `my-wordnet-index` and configures an analyzer with a `synonym` filter. The filter is configured with the [`wordnet`](https://wordnet.princeton.edu/) rule format: + +```json +PUT /my-wordnet-index +{ + "settings": { + "analysis": { + "filter": { + "my_wordnet_synonym_filter": { + "type": "synonym", + "format": "wordnet", + "synonyms": [ + "s(100000001,1,'fast',v,1,0).", + "s(100000001,2,'quick',v,1,0).", + "s(100000001,3,'swift',v,1,0)." 
+ ] + } + }, + "analyzer": { + "my_wordnet_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "my_wordnet_synonym_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-wordnet-index/_analyze +{ + "analyzer": "my_wordnet_analyzer", + "text": "I have a fast car" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "i", + "start_offset": 0, + "end_offset": 1, + "type": "", + "position": 0 + }, + { + "token": "have", + "start_offset": 2, + "end_offset": 6, + "type": "", + "position": 1 + }, + { + "token": "a", + "start_offset": 7, + "end_offset": 8, + "type": "", + "position": 2 + }, + { + "token": "fast", + "start_offset": 9, + "end_offset": 13, + "type": "", + "position": 3 + }, + { + "token": "quick", + "start_offset": 9, + "end_offset": 13, + "type": "SYNONYM", + "position": 3 + }, + { + "token": "swift", + "start_offset": 9, + "end_offset": 13, + "type": "SYNONYM", + "position": 3 + }, + { + "token": "car", + "start_offset": 14, + "end_offset": 17, + "type": "", + "position": 4 + } + ] +} +``` diff --git a/_analyzers/token-filters/trim.md b/_analyzers/token-filters/trim.md new file mode 100644 index 0000000000..cdfebed52f --- /dev/null +++ b/_analyzers/token-filters/trim.md @@ -0,0 +1,93 @@ +--- +layout: default +title: Trim +parent: Token filters +nav_order: 430 +--- + +# Trim token filter + +The `trim` token filter removes leading and trailing white space characters from tokens. + +Many popular tokenizers, such as `standard`, `keyword`, and `whitespace` tokenizers, automatically strip leading and trailing white space characters during tokenization. When using these tokenizers, there is no need to configure an additional `trim` token filter. 
+{: .note} + + +## Example + +The following example request creates a new index named `my_pattern_trim_index` and configures an analyzer with a `trim` filter and a `pattern` tokenizer, which does not remove leading and trailing white space characters: + +```json +PUT /my_pattern_trim_index +{ + "settings": { + "analysis": { + "filter": { + "my_trim_filter": { + "type": "trim" + } + }, + "tokenizer": { + "my_pattern_tokenizer": { + "type": "pattern", + "pattern": "," + } + }, + "analyzer": { + "my_pattern_trim_analyzer": { + "type": "custom", + "tokenizer": "my_pattern_tokenizer", + "filter": [ + "lowercase", + "my_trim_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my_pattern_trim_index/_analyze +{ + "analyzer": "my_pattern_trim_analyzer", + "text": " OpenSearch , is , powerful " +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "opensearch", + "start_offset": 0, + "end_offset": 12, + "type": "word", + "position": 0 + }, + { + "token": "is", + "start_offset": 13, + "end_offset": 18, + "type": "word", + "position": 1 + }, + { + "token": "powerful", + "start_offset": 19, + "end_offset": 32, + "type": "word", + "position": 2 + } + ] +} +``` diff --git a/_analyzers/token-filters/truncate.md b/_analyzers/token-filters/truncate.md new file mode 100644 index 0000000000..16d1452901 --- /dev/null +++ b/_analyzers/token-filters/truncate.md @@ -0,0 +1,107 @@ +--- +layout: default +title: Truncate +parent: Token filters +nav_order: 440 +--- + +# Truncate token filter + +The `truncate` token filter is used to shorten tokens exceeding a specified length. It trims tokens to a maximum number of characters, ensuring that tokens exceeding this limit are truncated. + +## Parameters + +The `truncate` token filter can be configured with the following parameter. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`length` | Optional | Integer | Specifies the maximum length of the generated token. Default is `10`. 
+ +## Example + +The following example request creates a new index named `truncate_example` and configures an analyzer with a `truncate` filter: + +```json +PUT /truncate_example +{ + "settings": { + "analysis": { + "filter": { + "truncate_filter": { + "type": "truncate", + "length": 5 + } + }, + "analyzer": { + "truncate_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "truncate_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /truncate_example/_analyze +{ + "analyzer": "truncate_analyzer", + "text": "OpenSearch is powerful and scalable" +} + +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "opens", + "start_offset": 0, + "end_offset": 10, + "type": "", + "position": 0 + }, + { + "token": "is", + "start_offset": 11, + "end_offset": 13, + "type": "", + "position": 1 + }, + { + "token": "power", + "start_offset": 14, + "end_offset": 22, + "type": "", + "position": 2 + }, + { + "token": "and", + "start_offset": 23, + "end_offset": 26, + "type": "", + "position": 3 + }, + { + "token": "scala", + "start_offset": 27, + "end_offset": 35, + "type": "", + "position": 4 + } + ] +} +``` diff --git a/_analyzers/token-filters/unique.md b/_analyzers/token-filters/unique.md new file mode 100644 index 0000000000..c4dfcbab16 --- /dev/null +++ b/_analyzers/token-filters/unique.md @@ -0,0 +1,106 @@ +--- +layout: default +title: Unique +parent: Token filters +nav_order: 450 +--- + +# Unique token filter + +The `unique` token filter ensures that only unique tokens are kept during the analysis process, removing duplicate tokens that appear within a single field or text block. + +## Parameters + +The `unique` token filter can be configured with the following parameter. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`only_on_same_position` | Optional | Boolean | If `true`, the token filter acts as a `remove_duplicates` token filter and only removes tokens that are in the same position. Default is `false`. 
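+
+To see the effect of `only_on_same_position`, you can combine the filter with `keyword_repeat` and `kstem` inline in the `_analyze` API. The following minimal sketch reuses the `Slower turtle` input from the `remove_duplicates` filter documentation; with `only_on_same_position` set to `true`, only the duplicate `turtle` token (which appears twice in the same position) is removed, while `slower` and `slow` are both kept:
+
+```json
+POST /_analyze
+{
+  "tokenizer": "standard",
+  "filter": [
+    "lowercase",
+    "keyword_repeat",
+    "kstem",
+    { "type": "unique", "only_on_same_position": true }
+  ],
+  "text": "Slower turtle"
+}
+```
+{% include copy-curl.html %}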
+ +## Example + +The following example request creates a new index named `unique_example` and configures an analyzer with a `unique` filter: + +```json +PUT /unique_example +{ + "settings": { + "analysis": { + "filter": { + "unique_filter": { + "type": "unique", + "only_on_same_position": false + } + }, + "analyzer": { + "unique_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "unique_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /unique_example/_analyze +{ + "analyzer": "unique_analyzer", + "text": "OpenSearch OpenSearch is powerful powerful and scalable" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "opensearch", + "start_offset": 0, + "end_offset": 10, + "type": "", + "position": 0 + }, + { + "token": "is", + "start_offset": 22, + "end_offset": 24, + "type": "", + "position": 1 + }, + { + "token": "powerful", + "start_offset": 25, + "end_offset": 33, + "type": "", + "position": 2 + }, + { + "token": "and", + "start_offset": 43, + "end_offset": 46, + "type": "", + "position": 3 + }, + { + "token": "scalable", + "start_offset": 47, + "end_offset": 55, + "type": "", + "position": 4 + } + ] +} +``` diff --git a/_analyzers/token-filters/uppercase.md b/_analyzers/token-filters/uppercase.md new file mode 100644 index 0000000000..5026892400 --- /dev/null +++ b/_analyzers/token-filters/uppercase.md @@ -0,0 +1,83 @@ +--- +layout: default +title: Uppercase +parent: Token filters +nav_order: 460 +--- + +# Uppercase token filter + +The `uppercase` token filter is used to convert all tokens (words) to uppercase during analysis. + +## Example + +The following example request creates a new index named `uppercase_example` and configures an analyzer with an `uppercase` filter: + +```json +PUT /uppercase_example +{ + "settings": { + "analysis": { + "filter": { + "uppercase_filter": { + "type": "uppercase" + } + }, + "analyzer": { + "uppercase_analyzer": { + "type": "custom", + "tokenizer": "standard", + "filter": [ + "lowercase", + "uppercase_filter" + ] + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /uppercase_example/_analyze +{ + "analyzer": "uppercase_analyzer", + "text": "OpenSearch is powerful" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "OPENSEARCH", + "start_offset": 0, + "end_offset": 10, + "type": "", + "position": 0 + }, + { + "token": "IS", + "start_offset": 11, + "end_offset": 13, + "type": "", + "position": 1 + }, + { + "token": "POWERFUL", + "start_offset": 14, + "end_offset": 22, + "type": "", + "position": 2 + } + ] +} +``` diff --git a/_analyzers/token-filters/word-delimiter-graph.md b/_analyzers/token-filters/word-delimiter-graph.md new file mode 100644 index 0000000000..ac734bebeb --- /dev/null +++ b/_analyzers/token-filters/word-delimiter-graph.md @@ -0,0 +1,164 @@ +--- +layout: default +title: Word delimiter graph +parent: Token filters +nav_order: 480 +--- + +# Word delimiter graph token filter + +The `word_delimiter_graph` token filter is used to split tokens at predefined characters and also offers optional token normalization based on customizable rules. 
+ +The `word_delimiter_graph` filter is used to remove punctuation from complex identifiers like part numbers or product IDs. In such cases, it is best used with the `keyword` tokenizer. For hyphenated words, use the `synonym_graph` token filter instead of the `word_delimiter_graph` filter because users frequently search for these terms both with and without hyphens. +{: .note} + +By default, the filter applies the following rules. + +| Description | Input | Output | +|:---|:---|:---| +| Treats non-alphanumeric characters as delimiters. | `ultra-fast` | `ultra`, `fast` | +| Removes delimiters at the beginning or end of tokens. | `Z99++'Decoder'`| `Z99`, `Decoder` | +| Splits tokens when there is a transition between uppercase and lowercase letters. | `OpenSearch` | `Open`, `Search` | +| Splits tokens when there is a transition between letters and numbers. | `T1000` | `T`, `1000` | +| Removes the possessive ('s) from the end of tokens. | `John's` | `John` | + +It's important **not** to use tokenizers that strip punctuation, like the `standard` tokenizer, with this filter. Doing so may prevent proper token splitting and interfere with options like `catenate_all` or `preserve_original`. We recommend using this filter with a `keyword` or `whitespace` tokenizer. +{: .important} + +## Parameters + +You can configure the `word_delimiter_graph` token filter using the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`adjust_offsets` | Optional | Boolean | Determines whether the token offsets should be recalculated for split or concatenated tokens. When `true`, the filter adjusts the token offsets to accurately represent the token's position within the token stream. This adjustment ensures that the token's location in the text aligns with its modified form after processing, which is particularly useful for applications like highlighting or phrase queries. When `false`, the offsets remain unchanged, which may result in misalignment when the processed tokens are mapped back to their positions in the original text. If your analyzer uses filters like `trim` that change the token lengths without changing their offsets, we recommend setting this parameter to `false`. Default is `true`. +`catenate_all` | Optional | Boolean | Produces concatenated tokens from a sequence of alphanumeric parts. For example, `"quick-fast-200"` becomes `[ quickfast200, quick, fast, 200 ]`. Default is `false`. +`catenate_numbers` | Optional | Boolean | Concatenates numerical sequences. For example, `"10-20-30"` becomes `[ 102030, 10, 20, 30 ]`. Default is `false`. +`catenate_words` | Optional | Boolean | Concatenates alphabetic words. For example, `"high-speed-level"` becomes `[ highspeedlevel, high, speed, level ]`. Default is `false`. +`generate_number_parts` | Optional | Boolean | If `true`, numeric tokens (tokens consisting of numbers only) are included in the output. Default is `true`. +`generate_word_parts` | Optional | Boolean | If `true`, alphabetical tokens (tokens consisting of alphabetic characters only) are included in the output. Default is `true`. +`ignore_keywords` | Optional | Boolean | Whether to process tokens marked as keywords. Default is `false`. +`preserve_original` | Optional | Boolean | Keeps the original token (which may include non-alphanumeric delimiters) alongside the generated tokens in the output. For example, `"auto-drive-300"` becomes `[ auto-drive-300, auto, drive, 300 ]`. 
If `true`, the filter generates multi-position tokens, which are not supported for indexing; therefore, either avoid using this filter in an index analyzer or add the `flatten_graph` filter after it. Default is `false`.
+`protected_words` | Optional | Array of strings | Specifies tokens that should not be split.
+`protected_words_path` | Optional | String | Specifies a path (absolute or relative to the config directory) to a file containing tokens that should not be split, with one token per line.
+`split_on_case_change` | Optional | Boolean | Splits tokens where consecutive letters have different cases (one is lowercase and the other is uppercase). For example, `"OpenSearch"` becomes `[ Open, Search ]`. Default is `true`.
+`split_on_numerics` | Optional | Boolean | Splits tokens where letters and numbers are adjacent. For example, `"v8engine"` becomes `[ v, 8, engine ]`. Default is `true`.
+`stem_english_possessive` | Optional | Boolean | Removes English possessive endings, such as `'s`. Default is `true`.
+`type_table` | Optional | Array of strings | A custom map that specifies how to treat characters and whether to treat them as delimiters, which avoids unwanted splitting. For example, to treat a hyphen (`-`) as an alphanumeric character, specify `["- => ALPHA"]` so that words are not split at hyphens. Valid types are:
- `ALPHA`: alphabetical
- `ALPHANUM`: alphanumeric
- `DIGIT`: numeric
- `LOWER`: lowercase alphabetical
- `SUBWORD_DELIM`: non-alphanumeric delimiter
- `UPPER`: uppercase alphabetical
+`type_table_path` | Optional | String | Specifies a path (absolute or relative to the config directory) to a file containing a custom character map. The map specifies how to treat characters and whether to treat them as delimiters, which avoids unwanted splitting. For valid types, see `type_table`.
+
+## Example
+
+The following example request creates a new index named `my-custom-index` and configures an analyzer with a `word_delimiter_graph` filter:
+
+```json
+PUT /my-custom-index
+{
+  "settings": {
+    "analysis": {
+      "analyzer": {
+        "custom_analyzer": {
+          "tokenizer": "keyword",
+          "filter": [ "custom_word_delimiter_filter" ]
+        }
+      },
+      "filter": {
+        "custom_word_delimiter_filter": {
+          "type": "word_delimiter_graph",
+          "split_on_case_change": true,
+          "split_on_numerics": true,
+          "stem_english_possessive": true
+        }
+      }
+    }
+  }
+}
+```
+{% include copy-curl.html %}
+
+## Generated tokens
+
+Use the following request to examine the tokens generated using the analyzer:
+
+```json
+GET /my-custom-index/_analyze
+{
+  "analyzer": "custom_analyzer",
+  "text": "FastCar's Model2023"
+}
+```
+{% include copy-curl.html %}
+
+The response contains the generated tokens:
+
+```json
+{
+  "tokens": [
+    {
+      "token": "Fast",
+      "start_offset": 0,
+      "end_offset": 4,
+      "type": "word",
+      "position": 0
+    },
+    {
+      "token": "Car",
+      "start_offset": 4,
+      "end_offset": 7,
+      "type": "word",
+      "position": 1
+    },
+    {
+      "token": "Model",
+      "start_offset": 10,
+      "end_offset": 15,
+      "type": "word",
+      "position": 2
+    },
+    {
+      "token": "2023",
+      "start_offset": 15,
+      "end_offset": 19,
+      "type": "word",
+      "position": 3
+    }
+  ]
+}
+```
+
+## Differences between the `word_delimiter_graph` and `word_delimiter` filters
+
+Both the `word_delimiter_graph` and `word_delimiter` token filters generate tokens spanning multiple positions when any of the following parameters are set to `true`:
+
+- `catenate_all`
+- `catenate_numbers`
+- `catenate_words`
+- `preserve_original`
+
+To illustrate the differences between these filters, consider the input text `Pro-XT500`.
+
+### `word_delimiter_graph`
+
+The `word_delimiter_graph` filter assigns a `positionLength` attribute to multi-position tokens, indicating how many positions a token spans. This ensures that the filter always generates valid token graphs, making it suitable for use in advanced token graph scenarios. Although token graphs with multi-position tokens are not supported for indexing, they can still be useful in search scenarios. For example, queries like `match_phrase` can use these graphs to generate multiple subqueries from a single input string. For the example input text, the `word_delimiter_graph` filter generates the following tokens:
+
+- `Pro` (position 1)
+- `XT500` (position 2)
+- `ProXT500` (position 1, `positionLength`: 2)
+
+The `positionLength` attribute enables the production of a valid graph that can be used in advanced queries.
+
+### `word_delimiter`
+
+In contrast, the `word_delimiter` filter does not assign a `positionLength` attribute to multi-position tokens, leading to invalid graphs when these tokens are present. For the example input text, the `word_delimiter` filter generates the following tokens:
+
+- `Pro` (position 1)
+- `XT500` (position 2)
+- `ProXT500` (position 1, no `positionLength`)
+
+The lack of a `positionLength` attribute results in a token graph that is invalid for token streams containing multi-position tokens.
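+
+To observe these attributes yourself, you can run the filter inline in the `_analyze` API with `"explain": true`, which includes detailed token attributes such as `positionLength` in the response. The following is a minimal sketch using the `Pro-XT500` input from the preceding discussion:
+
+```json
+POST /_analyze
+{
+  "tokenizer": "keyword",
+  "filter": [
+    { "type": "word_delimiter_graph", "catenate_all": true }
+  ],
+  "text": "Pro-XT500",
+  "explain": true
+}
+```
+{% include copy-curl.html %}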
\ No newline at end of file diff --git a/_analyzers/token-filters/word-delimiter.md b/_analyzers/token-filters/word-delimiter.md new file mode 100644 index 0000000000..d820fae2a0 --- /dev/null +++ b/_analyzers/token-filters/word-delimiter.md @@ -0,0 +1,128 @@ +--- +layout: default +title: Word delimiter +parent: Token filters +nav_order: 470 +--- + +# Word delimiter token filter + +The `word_delimiter` token filter is used to split tokens at predefined characters and also offers optional token normalization based on customizable rules. + +We recommend using the `word_delimiter_graph` filter instead of the `word_delimiter` filter whenever possible because the `word_delimiter` filter sometimes produces invalid token graphs. For more information about the differences between the two filters, see [Differences between the `word_delimiter_graph` and `word_delimiter` filters]({{site.url}}{{site.baseurl}}/analyzers/token-filters/word-delimiter-graph/#differences-between-the-word_delimiter_graph-and-word_delimiter-filters). +{: .important} + +The `word_delimiter` filter is used to remove punctuation from complex identifiers like part numbers or product IDs. In such cases, it is best used with the `keyword` tokenizer. For hyphenated words, use the `synonym_graph` token filter instead of the `word_delimiter` filter because users frequently search for these terms both with and without hyphens. +{: .note} + +By default, the filter applies the following rules. + +| Description | Input | Output | +|:---|:---|:---| +| Treats non-alphanumeric characters as delimiters. | `ultra-fast` | `ultra`, `fast` | +| Removes delimiters at the beginning or end of tokens. | `Z99++'Decoder'`| `Z99`, `Decoder` | +| Splits tokens when there is a transition between uppercase and lowercase letters. | `OpenSearch` | `Open`, `Search` | +| Splits tokens when there is a transition between letters and numbers. | `T1000` | `T`, `1000` | +| Removes the possessive ('s) from the end of tokens. | `John's` | `John` | + +It's important **not** to use tokenizers that strip punctuation, like the `standard` tokenizer, with this filter. Doing so may prevent proper token splitting and interfere with options like `catenate_all` or `preserve_original`. We recommend using this filter with a `keyword` or `whitespace` tokenizer. +{: .important} + +## Parameters + +You can configure the `word_delimiter` token filter using the following parameters. + +Parameter | Required/Optional | Data type | Description +:--- | :--- | :--- | :--- +`catenate_all` | Optional | Boolean | Produces concatenated tokens from a sequence of alphanumeric parts. For example, `"quick-fast-200"` becomes `[ quickfast200, quick, fast, 200 ]`. Default is `false`. +`catenate_numbers` | Optional | Boolean | Concatenates numerical sequences. For example, `"10-20-30"` becomes `[ 102030, 10, 20, 30 ]`. Default is `false`. +`catenate_words` | Optional | Boolean | Concatenates alphabetic words. For example, `"high-speed-level"` becomes `[ highspeedlevel, high, speed, level ]`. Default is `false`. +`generate_number_parts` | Optional | Boolean | If `true`, numeric tokens (tokens consisting of numbers only) are included in the output. Default is `true`. +`generate_word_parts` | Optional | Boolean | If `true`, alphabetical tokens (tokens consisting of alphabetic characters only) are included in the output. Default is `true`. +`preserve_original` | Optional | Boolean | Keeps the original token (which may include non-alphanumeric delimiters) alongside the generated tokens in the output. 
For example, `"auto-drive-300"` becomes `[ auto-drive-300, auto, drive, 300 ]`. If `true`, the filter generates multi-position tokens not supported by indexing, so do not use this filter in an index analyzer or use the `flatten_graph` filter after this filter. Default is `false`. +`protected_words` | Optional | Array of strings | Specifies tokens that should not be split. +`protected_words_path` | Optional | String | Specifies a path (absolute or relative to the config directory) to a file containing tokens that should not be separated by new lines. +`split_on_case_change` | Optional | Boolean | Splits tokens where consecutive letters have different cases (one is lowercase and the other is uppercase). For example, `"OpenSearch"` becomes `[ Open, Search ]`. Default is `true`. +`split_on_numerics` | Optional | Boolean | Splits tokens where there are consecutive letters and numbers. For example `"v8engine"` will become `[ v, 8, engine ]`. Default is `true`. +`stem_english_possessive` | Optional | Boolean | Removes English possessive endings, such as `'s`. Default is `true`. +`type_table` | Optional | Array of strings | A custom map that specifies how to treat characters and whether to treat them as delimiters, which avoids unwanted splitting. For example, to treat a hyphen (`-`) as an alphanumeric character, specify `["- => ALPHA"]` so that words are not split at hyphens. Valid types are:
- `ALPHA`: alphabetical
- `ALPHANUM`: alphanumeric
- `DIGIT`: numeric
- `LOWER`: lowercase alphabetical
- `SUBWORD_DELIM`: non-alphanumeric delimiter
- `UPPER`: uppercase alphabetical +`type_table_path` | Optional | String | Specifies a path (absolute or relative to the config directory) to a file containing a custom character map. The map specifies how to treat characters and whether to treat them as delimiters, which avoids unwanted splitting. For valid types, see `type_table`. + +## Example + +The following example request creates a new index named `my-custom-index` and configures an analyzer with a `word_delimiter` filter: + +```json +PUT /my-custom-index +{ + "settings": { + "analysis": { + "analyzer": { + "custom_analyzer": { + "tokenizer": "keyword", + "filter": [ "custom_word_delimiter_filter" ] + } + }, + "filter": { + "custom_word_delimiter_filter": { + "type": "word_delimiter", + "split_on_case_change": true, + "split_on_numerics": true, + "stem_english_possessive": true + } + } + } + } +} +``` +{% include copy-curl.html %} + +## Generated tokens + +Use the following request to examine the tokens generated using the analyzer: + +```json +GET /my-custom-index/_analyze +{ + "analyzer": "custom_analyzer", + "text": "FastCar's Model2023" +} +``` +{% include copy-curl.html %} + +The response contains the generated tokens: + +```json +{ + "tokens": [ + { + "token": "Fast", + "start_offset": 0, + "end_offset": 4, + "type": "word", + "position": 0 + }, + { + "token": "Car", + "start_offset": 4, + "end_offset": 7, + "type": "word", + "position": 1 + }, + { + "token": "Model", + "start_offset": 10, + "end_offset": 15, + "type": "word", + "position": 2 + }, + { + "token": "2023", + "start_offset": 15, + "end_offset": 19, + "type": "word", + "position": 3 + } + ] +} +``` diff --git a/_api-reference/common-parameters.md b/_api-reference/common-parameters.md index 5b536ad992..ac3efbf4bf 100644 --- a/_api-reference/common-parameters.md +++ b/_api-reference/common-parameters.md @@ -123,4 +123,17 @@ Kilometers | `km` or `kilometers` Meters | `m` or `meters` Centimeters | `cm` or `centimeters` Millimeters | `mm` or `millimeters` -Nautical miles | `NM`, `nmi`, or `nauticalmiles` \ No newline at end of file +Nautical miles | `NM`, `nmi`, or `nauticalmiles` + +## `X-Opaque-Id` header + +You can specify an opaque identifier for any request using the `X-Opaque-Id` header. This identifier is used to track tasks and deduplicate deprecation warnings in server-side logs, as well as to differentiate between callers sending requests to your OpenSearch cluster. Do not specify a unique value per request. + +#### Example request + +The following request adds an opaque ID to the request: + +```bash +curl -H "X-Opaque-Id: my-curl-client-1" -XGET localhost:9200/_tasks +``` +{% include copy.html %} diff --git a/_api-reference/index-apis/update-settings.md b/_api-reference/index-apis/update-settings.md index 18caf2185d..3afaaa10d3 100644 --- a/_api-reference/index-apis/update-settings.md +++ b/_api-reference/index-apis/update-settings.md @@ -11,7 +11,7 @@ redirect_from: **Introduced 1.0** {: .label .label-purple } -You can use the update settings API operation to update index-level settings. You can change dynamic index settings at any time, but static settings cannot be changed after index creation. For more information about static and dynamic index settings, see [Create index]({{site.url}}{{site.baseurl}}/api-reference/index-apis/create-index/). +You can use the update settings API operation to update index-level settings. You can change dynamic index settings at any time, but static settings cannot be changed after index creation.
For more information about static and dynamic index settings, see [Configuring OpenSearch]({{site.url}}{{site.baseurl}}/install-and-configure/configuring-opensearch/index/). Aside from the static and dynamic index settings, you can also update individual plugins' settings. To get the full list of updatable settings, run `GET /_settings?include_defaults=true`. diff --git a/_automating-configurations/api/create-workflow.md b/_automating-configurations/api/create-workflow.md index 610bfe8fab..ad9552c3ef 100644 --- a/_automating-configurations/api/create-workflow.md +++ b/_automating-configurations/api/create-workflow.md @@ -16,7 +16,7 @@ Creating a workflow adds the content of a workflow template to the flow framewor To obtain the validation template for workflow steps, call the [Get Workflow Steps API]({{site.url}}{{site.baseurl}}/automating-configurations/api/get-workflow-steps/). -You can include placeholder expressions in the value of workflow step fields. For example, you can specify a credential field in a template as `openAI_key: '${{ openai_key }}'`. The expression will be substituted with the user-provided value during provisioning, using the format {% raw %}`${{ }}`{% endraw %}. You can pass the actual key as a parameter by using the [Provision Workflow API]({{site.url}}{{site.baseurl}}/automating-configurations/api/provision-workflow/) or by using this API with the `provision` parameter set to `true`. +You can include placeholder expressions in the value of workflow step fields. For example, you can specify a credential field in a template as {% raw %}`openAI_key: '${{ openai_key }}'`{% endraw %}. The expression will be substituted with the user-provided value during provisioning, using the format {% raw %}`${{ }}`{% endraw %}. You can pass the actual key as a parameter by using the [Provision Workflow API]({{site.url}}{{site.baseurl}}/automating-configurations/api/provision-workflow/) or by using this API with the `provision` parameter set to `true`. Once a workflow is created, provide its `workflow_id` to other APIs. diff --git a/_automating-configurations/api/provision-workflow.md b/_automating-configurations/api/provision-workflow.md index 62c4954ee9..cb1fe42789 100644 --- a/_automating-configurations/api/provision-workflow.md +++ b/_automating-configurations/api/provision-workflow.md @@ -30,7 +30,7 @@ The following table lists the available path parameters. ## Query parameters -If you have included a substitution expression in the template, you may pass it as a query parameter or as a string value of a request body field. For example, if you specified a credential field in a template as `openAI_key: '${{ openai_key }}'`, then you can include the `openai_key` parameter as a query parameter or body field so it can be substituted during provisioning. For example, the following request provides a query parameter: +If you have included a substitution expression in the template, you may pass it as a query parameter or as a string value of a request body field. For example, if you specified a credential field in a template as {% raw %}`openAI_key: '${{ openai_key }}'`{% endraw %}, then you can include the `openai_key` parameter as a query parameter or body field so it can be substituted during provisioning. 
For example, the following request provides a query parameter: ```json POST /_plugins/_flow_framework/workflow/<workflow_id>/_provision?<parameter>=<value> @@ -47,14 +47,14 @@ POST /_plugins/_flow_framework/workflow/8xL8bowB8y25Tqfenm50/_provision ``` {% include copy-curl.html %} -The following request substitutes the expression `${{ openai_key }}` with the value "12345" using a query parameter: +The following request substitutes the expression {% raw %}`${{ openai_key }}`{% endraw %} with the value "12345" using a query parameter: ```json POST /_plugins/_flow_framework/workflow/8xL8bowB8y25Tqfenm50/_provision?openai_key=12345 ``` {% include copy-curl.html %} -The following request substitutes the expression `${{ openai_key }}` with the value "12345" using the request body: +The following request substitutes the expression {% raw %}`${{ openai_key }}`{% endraw %} with the value "12345" using the request body: ```json POST /_plugins/_flow_framework/workflow/8xL8bowB8y25Tqfenm50/_provision diff --git a/_benchmark/reference/commands/aggregate.md b/_benchmark/reference/commands/aggregate.md index 17612f1164..a891bf3edf 100644 --- a/_benchmark/reference/commands/aggregate.md +++ b/_benchmark/reference/commands/aggregate.md @@ -69,9 +69,30 @@ Aggregate test execution ID: aggregate_results_geonames_9aafcfb8-d3b7-4583-864e ------------------------------- ``` -The results will be aggregated into one test execution and stored under the ID shown in the output: +The results will be aggregated into one test execution and stored under the ID shown in the output. +### Additional options - `--test-execution-id`: Define a unique ID for the aggregated test execution. - `--results-file`: Write the aggregated results to the provided file. - `--workload-repository`: Define the repository from which OpenSearch Benchmark will load workloads (default is `default`). +## Aggregated results + +Aggregated results include the following information: + +- **Relative Standard Deviation (RSD)**: For each metric, an additional `mean_rsd` value shows the spread of results across test executions. +- **Overall min/max values**: Instead of averaging minimum and maximum values, the aggregated results include `overall_min` and `overall_max` values, which reflect the true minimum/maximum across all test runs. +- **Storage**: Aggregated test results are stored in a separate `aggregated_results` folder alongside the `test_executions` folder.
+ +The following example shows aggregated results: + +```json + "throughput": { + "overall_min": 29056.890292903263, + "mean": 50115.8603858536, + "median": 50099.54349684457, + "overall_max": 72255.15946248993, + "unit": "docs/s", + "mean_rsd": 59.426059705973664 + }, +``` diff --git a/_config.yml b/_config.yml index f2749b66f8..3c6f737cc8 100644 --- a/_config.yml +++ b/_config.yml @@ -31,9 +31,6 @@ collections: install-and-configure: permalink: /:collection/:path/ output: true - upgrade-to: - permalink: /:collection/:path/ - output: true im-plugin: permalink: /:collection/:path/ output: true @@ -94,6 +91,9 @@ collections: data-prepper: permalink: /:collection/:path/ output: true + migration-assistant: + permalink: /:collection/:path/ + output: true tools: permalink: /:collection/:path/ output: true @@ -121,6 +121,9 @@ collections: getting-started: permalink: /:collection/:path/ output: true + workspace: + permalink: /:collection/:path/ + output: true opensearch_collection: # Define the collections used in the theme @@ -134,11 +137,6 @@ opensearch_collection: install-and-configure: name: Install and upgrade nav_fold: true - upgrade-to: - name: Migrate to OpenSearch - # nav_exclude: true - nav_fold: true - # search_exclude: true im-plugin: name: Managing Indexes nav_fold: true @@ -210,6 +208,12 @@ clients_collection: name: Clients nav_fold: true +migration_assistant_collection: + collections: + migration-assistant: + name: Migration Assistant + nav_fold: true + benchmark_collection: collections: benchmark: @@ -249,6 +253,12 @@ defaults: values: section: "benchmark" section-name: "Benchmark" + - + scope: + path: "_migration-assistant" + values: + section: "migration-assistant" + section-name: "Migration Assistant" # Enable or disable the site search # By default, just-the-docs enables its JSON file-based search. We also have an OpenSearch-driven search functionality. @@ -308,6 +318,7 @@ plugins: - jekyll-remote-theme - jekyll-redirect-from - jekyll-sitemap + - jekyll-spec-insert # This format has to conform to RFC822 last-modified-at: @@ -317,6 +328,8 @@ last-modified-at: # The following items will not be processed, by default. Create a custom list # to override the default setting. exclude: + - README.md + - DEVELOPER_GUIDE.md - Gemfile - Gemfile.lock - node_modules @@ -324,6 +337,12 @@ exclude: - vendor/cache/ - vendor/gems/ - vendor/ruby/ - - README.md - - .idea - - templates + - templates/ + - .sass-cache/ + - .jekyll-cache/ + - .idea/ + - .github/ + - .bundle/ + - _site/ + - spec-insert + - release-notes \ No newline at end of file diff --git a/_dashboards/dashboards-assistant/alert-insight.md b/_dashboards/dashboards-assistant/alert-insight.md index 9e41b977ca..603e5aba44 100644 --- a/_dashboards/dashboards-assistant/alert-insight.md +++ b/_dashboards/dashboards-assistant/alert-insight.md @@ -197,6 +197,9 @@ POST /.plugins-ml-config/_doc/os_insight The created `os_insight` agent provides alert insights related to OpenSearch cluster metrics. For insights about alerts unrelated to OpenSearch cluster metrics, you need to register an agent with [this template](https://github.com/opensearch-project/flow-framework/blob/2.x/sample-templates/create-knowledge-base-alert-agent.json) and change the agent name to `KB_For_Alert_Insight`. {: .note} +This example demonstrates a system index. In security-enabled domains, only superadmins have permissions to execute this code. 
For information about making superadmin calls, see [System indexes]({{site.url}}{{site.baseurl}}/security/configuration/system-indices/). For access permissions, contact your system administrator. +{: .warning} + ### Step 4: Test the agents You can verify that the agents were created successfully by calling the agents with an example payload. diff --git a/_dashboards/dashboards-assistant/data-summary.md b/_dashboards/dashboards-assistant/data-summary.md index 5ad465be62..e90e184e07 100644 --- a/_dashboards/dashboards-assistant/data-summary.md +++ b/_dashboards/dashboards-assistant/data-summary.md @@ -36,7 +36,7 @@ queryEnhancements.queryAssist.summary.enabled: true ### Step 2: Create a data summary agent -To orchestrate data summarization, create a data summary [agent]({{site.url}}{{site.baseurl}}/ml-commons-plugin/agents-tools/index/#agents). To create an agent, send a `POST /_plugins/_ml/agents/_register` request and provide the agent template as a payload: +To orchestrate data summarization, create a data summary [agent]({{site.url}}{{site.baseurl}}/ml-commons-plugin/agents-tools/index/#agents). To create an agent, send a `POST /_plugins/_flow_framework/workflow?provision=true` request and provide the agent template as a payload:

@@ -45,7 +45,7 @@ To orchestrate data summarization, create a data summary [agent]({{site.url}}{{s {: .text-delta} ```json -POST /_plugins/_ml/agents/_register +POST /_plugins/_flow_framework/workflow?provision=true { "name": "Query Assist Agent", "description": "Create a Query Assist Agent using Claude on BedRock", @@ -237,6 +237,9 @@ POST /.plugins-ml-config/_doc/os_data2summary ``` {% include copy-curl.html %} +This example demonstrates a system index. In security-enabled domains, only superadmins have permissions to execute this code. For information about making superadmin calls, see [System indexes]({{site.url}}{{site.baseurl}}/security/configuration/system-indices/). For access permissions, contact your system administrator. +{: .warning} + ### Step 4: Test the agent You can verify that the data summary agent was created successfully by calling the agent with an example payload: @@ -288,4 +291,4 @@ To view alert insights in OpenSearch Dashboards, use the following steps: 1. From the query language dropdown list, select **PPL**. You will see the generated data summary after the query text, as shown in the following image. - data summary \ No newline at end of file + data summary diff --git a/_dashboards/dashboards-assistant/suggest-anomaly-detector.md b/_dashboards/dashboards-assistant/suggest-anomaly-detector.md index 2c9f795e8d..8f4aac80fd 100644 --- a/_dashboards/dashboards-assistant/suggest-anomaly-detector.md +++ b/_dashboards/dashboards-assistant/suggest-anomaly-detector.md @@ -36,7 +36,7 @@ assistant.smartAnomalyDetector.enabled: true ### Step 2: Create an anomaly detector suggestion agent -To orchestrate anomaly detector suggestions, create an anomaly detector suggestion [agent]({{site.url}}{{site.baseurl}}/ml-commons-plugin/agents-tools/index/#agents). To create an agent, send a `POST /_plugins/_ml/agents/_register` request and provide the agent template as a payload. For more information, see [Configuring OpenSearch Assistant]({{site.url}}{{site.baseurl}}/dashboards/dashboards-assistant/index/#configuring-opensearch-assistant). +To orchestrate anomaly detector suggestions, create an anomaly detector suggestion [agent]({{site.url}}{{site.baseurl}}/ml-commons-plugin/agents-tools/index/#agents). To create an agent, send a `POST /_plugins/_flow_framework/workflow?provision=true` request and provide the agent template as a payload. For more information, see [Configuring OpenSearch Assistant]({{site.url}}{{site.baseurl}}/dashboards/dashboards-assistant/index/#configuring-opensearch-assistant). For sample agent templates, see [Flow Framework sample templates](https://github.com/opensearch-project/flow-framework/tree/2.x/sample-templates). Note the agent ID; you'll use it in the following step. @@ -55,6 +55,9 @@ POST /.plugins-ml-config/_doc/os_suggest_ad ``` {% include copy-curl.html %} +This example demonstrates a system index. In security-enabled domains, only superadmins have permissions to execute this code. For information about making superadmin calls, see [System indexes]({{site.url}}{{site.baseurl}}/security/configuration/system-indices/). For access permissions, contact your system administrator. 
+{: .warning} + +### Step 4: Test the agent  You can verify that the agent was created successfully by calling the agent with an example payload: diff --git a/_dashboards/dashboards-assistant/text-to-visualization.md b/_dashboards/dashboards-assistant/text-to-visualization.md index 5c0aab51f0..a30ca6d1f8 100644 --- a/_dashboards/dashboards-assistant/text-to-visualization.md +++ b/_dashboards/dashboards-assistant/text-to-visualization.md @@ -177,7 +177,7 @@ POST /_plugins/_flow_framework/workflow/<workflow_id>/_provision To view the status of the workflow and all created resources, send the following request: ```json -/_plugins/_flow_framework/workflow/<workflow_id>/_status +GET /_plugins/_flow_framework/workflow/<workflow_id>/_status ``` {% include copy-curl.html %} @@ -209,6 +209,9 @@ POST /.plugins-ml-config/_doc/os_text2vega_with_instructions ``` {% include copy-curl.html %} +This example demonstrates a system index. In security-enabled domains, only superadmins have permissions to execute this code. For information about making superadmin calls, see [System indexes]({{site.url}}{{site.baseurl}}/security/configuration/system-indices/). For access permissions, contact your system administrator. +{: .warning} + ### Step 4: Test the agent You can verify that the agent was created successfully by calling the agent with an example payload: diff --git a/_dashboards/management/accelerate-external-data.md b/_dashboards/management/accelerate-external-data.md index 6d1fa030e4..00eb8671ec 100644 --- a/_dashboards/management/accelerate-external-data.md +++ b/_dashboards/management/accelerate-external-data.md @@ -1,10 +1,8 @@ --- layout: default title: Optimize query performance using OpenSearch indexing -parent: Connecting Amazon S3 to OpenSearch -grand_parent: Data sources -nav_order: 15 -has_children: false +parent: Data sources +nav_order: 17 --- # Optimize query performance using OpenSearch indexing @@ -14,35 +12,171 @@ Introduced 2.11 Query performance can be slow when using external data sources for reasons such as network latency, data transformation, and data volume. You can optimize your query performance by using OpenSearch indexes, such as a skipping index or a covering index. -A _skipping index_ uses skip acceleration methods, such as partition, minimum and maximum values, and value sets, to ingest and create compact aggregate data structures. This makes them an economical option for direct querying scenarios. +- A _skipping index_ uses skip acceleration methods, such as partition, minimum and maximum values, and value sets, to ingest and create compact aggregate data structures. This makes them an economical option for direct querying scenarios. For more information, see [Skipping indexes](https://opensearch.org/docs/latest/dashboards/management/accelerate-external-data/#skipping-indexes). +- A _covering index_ ingests all or some of the data from the source into OpenSearch and makes it possible to use all OpenSearch Dashboards and plugin functionality. For more information, see [Covering indexes](https://opensearch.org/docs/latest/dashboards/management/accelerate-external-data/#covering-indexes). +- A _materialized view_ enhances query performance by storing precomputed and aggregated data from the source data. For more information, see [Materialized views](https://opensearch.org/docs/latest/dashboards/management/accelerate-external-data/#materialized-views). -A _covering index_ ingests all or some of the data from the source into OpenSearch and makes it possible to use all OpenSearch Dashboards and plugin functionality.
See the [Flint Index Reference Manual](https://github.com/opensearch-project/opensearch-spark/blob/main/docs/index.md) for comprehensive guidance on this feature's indexing process. +For comprehensive guidance on each indexing process, see the [Flint Index Reference Manual](https://github.com/opensearch-project/opensearch-spark/blob/main/docs/index.md). ## Data sources use case: Accelerate performance -To get started with the **Accelerate performance** use case available in **Data sources**, follow these steps: +To get started with accelerating query performance, perform the following steps: -1. Go to **OpenSearch Dashboards** > **Query Workbench** and select your Amazon S3 data source from the **Data sources** dropdown menu in the upper-left corner. -2. From the left-side navigation menu, select a database. -3. View the results in the table and confirm that you have the desired data. +1. Go to **OpenSearch Dashboards** > **Query Workbench** and select your data source from the **Data sources** dropdown menu. +2. From the navigation menu, select a database. +3. View the results in the table and confirm that you have the correct data. 4. Create an OpenSearch index by following these steps: - 1. Select the **Accelerate data** button. A pop-up window appears. - 2. Enter your details in **Select data fields**. In the **Database** field, select the desired acceleration index: **Skipping index** or **Covering index**. A _skipping index_ uses skip acceleration methods, such as partition, min/max, and value sets, to ingest data using compact aggregate data structures. This makes them an economical option for direct querying scenarios. A _covering index_ ingests all or some of the data from the source into OpenSearch and makes it possible to use all OpenSearch Dashboards and plugin functionality. -5. Under **Index settings**, enter the information for your acceleration index. For information about naming, select **Help**. Note that an Amazon S3 table can only have one skipping index at a time. + 1. Select **Accelerate data**. A pop-up window appears. + 2. Enter your database and table details under **Select data fields**. +5. For **Acceleration type**, select the type of acceleration according to your use case. Then, enter the information for your acceleration type. For more information, see the following sections: + - [Skipping indexes](https://opensearch.org/docs/latest/dashboards/management/accelerate-external-data/#skipping-indexes) + - [Covering indexes](https://opensearch.org/docs/latest/dashboards/management/accelerate-external-data/#covering-indexes) + - [Materialized views](https://opensearch.org/docs/latest/dashboards/management/accelerate-external-data/#materialized-views) + +## Skipping indexes + +A _skipping index_ uses skip acceleration methods, such as partition, min/max, and value sets, to ingest data using compact aggregate data structures. This makes them an economical option for direct querying scenarios. + +With a skipping index, you can index only the metadata of the data stored in Amazon S3. When you query a table with a skipping index, the query planner references the index and rewrites the query to efficiently locate the data, instead of scanning all partitions and files. This allows the skipping index to quickly narrow down the specific location of the stored data. ### Define skipping index settings -1. Under **Skipping index definition**, select the **Add fields** button to define the skipping index acceleration method and choose the fields you want to add. -2. 
Select the **Copy Query to Editor** button to apply your skipping index settings. -3. View the skipping index query details in the table pane and then select the **Run** button. Your index is added to the left-side navigation menu containing the list of your databases. +1. Under **Skipping index definition**, select **Generate** to automatically generate a skipping index. Alternatively, to manually choose the fields you want to add, select **Add fields**. Choose from the following types: + - `Partition`: Uses data partition details to locate data. This type is best for partitioning-based columns such as year, month, day, or hour. + - `MinMax`: Uses the lower and upper bounds of the indexed column to locate data. This type is best for numeric columns. + - `ValueSet`: Uses a unique value set to locate data. This type is best for columns with low to moderate cardinality that require exact matching. + - `BloomFilter`: Uses the Bloom filter algorithm to locate data. This type is best for columns with high cardinality that do not require exact matching. +2. Select **Create acceleration** to apply your skipping index settings. +3. View the skipping index query details and then select **Run**. OpenSearch adds your index to the left navigation pane. + +Alternatively, you can manually create a skipping index using Query Workbench. Select your data source from the dropdown and run a query like the following: + +```sql +CREATE SKIPPING INDEX +ON datasourcename.gluedatabasename.vpclogstable( + `srcaddr` BLOOM_FILTER, + `dstaddr` BLOOM_FILTER, + `day` PARTITION, + `account_id` BLOOM_FILTER + ) WITH ( +index_settings = '{"number_of_shards":5,"number_of_replicas":1}', +auto_refresh = true, +checkpoint_location = 's3://accountnum-vpcflow/AWSLogs/checkpoint' +) +``` + +## Covering indexes + +A _covering index_ ingests all or some of the data from the source into OpenSearch and makes it possible to use all OpenSearch Dashboards and plugin functionality. + +With a covering index, you can ingest data from a specified column in a table. This is the most performant of the three indexing types. Because OpenSearch ingests all data from your desired column, you get better performance and can perform advanced analytics. + +OpenSearch creates a new index from the covering index data. You can use this new index to create visualizations or for anomaly detection and geospatial capabilities. You can manage the covering index with Index State Management. For more information, see [Index State Management](https://opensearch.org/docs/latest/im-plugin/ism/index/). ### Define covering index settings -1. Under **Index settings**, enter a valid index name. Note that each Amazon S3 table can have multiple covering indexes. -2. Once you have added the index name, define the covering index fields by selecting `(add fields here)` under **Covering index definition**. -3. Select the **Copy Query to Editor** button to apply your covering index settings. -4. View the covering index query details in the table pane and then select the **Run** button. Your index is added to the left-side navigation menu containing the list of your databases. +1. For **Index name**, enter a valid index name. Note that each table can have multiple covering indexes. +2. Choose a **Refresh type**. By default, OpenSearch automatically refreshes the index. Otherwise, you must manually trigger a refresh using a `REFRESH` statement. +3. Enter a **Checkpoint location**, which is a path for refresh job checkpoints.
The location must be a path in an HDFS-compatible file system. +4. Define the covering index fields by selecting **(add fields here)** under **Covering index definition**. +5. Select **Create acceleration** to apply your covering index settings. +6. View the covering index query details and then select **Run**. OpenSearch adds your index to the left navigation pane. + +Alternatively, you can manually create a covering index on your table using Query Workbench. Select your data source from the dropdown and run a query like the following: + +```sql +CREATE INDEX vpc_covering_index +ON datasourcename.gluedatabasename.vpclogstable (version, account_id, interface_id, +srcaddr, dstaddr, srcport, dstport, protocol, packets, +bytes, start, action, log_status STRING, +`aws-account-id`, `aws-service`, `aws-region`, year, +month, day, hour ) +WITH ( + auto_refresh = true, + refresh_interval = '15 minute', + checkpoint_location = 's3://accountnum-vpcflow/AWSLogs/checkpoint' +) +``` + +## Materialized views + +With _materialized views_, you can use complex queries, such as aggregations, to power Dashboards visualizations. Materialized views ingest a small amount of your data, depending on the query, into OpenSearch. OpenSearch then forms an index from the ingested data that you can use for visualizations. You can manage the materialized view index with Index State Management. For more information, see [Index State Management](https://opensearch.org/docs/latest/im-plugin/ism/index/). + +### Define materialized view settings + +1. For **Index name**, enter a valid index name. Note that each table can have multiple materialized views. +2. Choose a **Refresh type**. By default, OpenSearch automatically refreshes the index. Otherwise, you must manually trigger a refresh using a `REFRESH` statement. +3. Enter a **Checkpoint location**, which is a path for refresh job checkpoints. The location must be a path in an HDFS-compatible file system. +4. Enter a **Watermark delay**, which defines how late data can arrive and still be processed, such as 1 minute or 10 seconds. +5. Define the materialized view fields under **Materialized view definition**. +6. Select **Create acceleration** to apply your materialized view index settings. +7. View the materialized view query details and then select **Run**. OpenSearch adds your index to the left navigation pane. + +Alternatively, you can manually create a materialized view index on your table using Query Workbench.
Select your data source from the dropdown and run a query like the following: + +```sql +CREATE MATERIALIZED VIEW {table_name}__week_live_mview AS + SELECT + cloud.account_uid AS `aws.vpc.cloud_account_uid`, + cloud.region AS `aws.vpc.cloud_region`, + cloud.zone AS `aws.vpc.cloud_zone`, + cloud.provider AS `aws.vpc.cloud_provider`, + + CAST(IFNULL(src_endpoint.port, 0) AS LONG) AS `aws.vpc.srcport`, + CAST(IFNULL(src_endpoint.svc_name, 'Unknown') AS STRING) AS `aws.vpc.pkt-src-aws-service`, + CAST(IFNULL(src_endpoint.ip, '0.0.0.0') AS STRING) AS `aws.vpc.srcaddr`, + CAST(IFNULL(src_endpoint.interface_uid, 'Unknown') AS STRING) AS `aws.vpc.src-interface_uid`, + CAST(IFNULL(src_endpoint.vpc_uid, 'Unknown') AS STRING) AS `aws.vpc.src-vpc_uid`, + CAST(IFNULL(src_endpoint.instance_uid, 'Unknown') AS STRING) AS `aws.vpc.src-instance_uid`, + CAST(IFNULL(src_endpoint.subnet_uid, 'Unknown') AS STRING) AS `aws.vpc.src-subnet_uid`, + + CAST(IFNULL(dst_endpoint.port, 0) AS LONG) AS `aws.vpc.dstport`, + CAST(IFNULL(dst_endpoint.svc_name, 'Unknown') AS STRING) AS `aws.vpc.pkt-dst-aws-service`, + CAST(IFNULL(dst_endpoint.ip, '0.0.0.0') AS STRING) AS `aws.vpc.dstaddr`, + CAST(IFNULL(dst_endpoint.interface_uid, 'Unknown') AS STRING) AS `aws.vpc.dst-interface_uid`, + CAST(IFNULL(dst_endpoint.vpc_uid, 'Unknown') AS STRING) AS `aws.vpc.dst-vpc_uid`, + CAST(IFNULL(dst_endpoint.instance_uid, 'Unknown') AS STRING) AS `aws.vpc.dst-instance_uid`, + CAST(IFNULL(dst_endpoint.subnet_uid, 'Unknown') AS STRING) AS `aws.vpc.dst-subnet_uid`, + CASE + WHEN regexp(dst_endpoint.ip, '(10\\..*)|(192\\.168\\..*)|(172\\.1[6-9]\\..*)|(172\\.2[0-9]\\..*)|(172\\.3[0-1]\\..*)') + THEN 'ingress' + ELSE 'egress' + END AS `aws.vpc.flow-direction`, + + CAST(IFNULL(connection_info['protocol_num'], 0) AS INT) AS `aws.vpc.connection.protocol_num`, + CAST(IFNULL(connection_info['tcp_flags'], '0') AS STRING) AS `aws.vpc.connection.tcp_flags`, + CAST(IFNULL(connection_info['protocol_ver'], '0') AS STRING) AS `aws.vpc.connection.protocol_ver`, + CAST(IFNULL(connection_info['boundary'], 'Unknown') AS STRING) AS `aws.vpc.connection.boundary`, + CAST(IFNULL(connection_info['direction'], 'Unknown') AS STRING) AS `aws.vpc.connection.direction`, + + CAST(IFNULL(traffic.packets, 0) AS LONG) AS `aws.vpc.packets`, + CAST(IFNULL(traffic.bytes, 0) AS LONG) AS `aws.vpc.bytes`, + + CAST(FROM_UNIXTIME(time / 1000) AS TIMESTAMP) AS `@timestamp`, + CAST(FROM_UNIXTIME(start_time / 1000) AS TIMESTAMP) AS `start_time`, + CAST(FROM_UNIXTIME(start_time / 1000) AS TIMESTAMP) AS `interval_start_time`, + CAST(FROM_UNIXTIME(end_time / 1000) AS TIMESTAMP) AS `end_time`, + status_code AS `aws.vpc.status_code`, + + severity AS `aws.vpc.severity`, + class_name AS `aws.vpc.class_name`, + category_name AS `aws.vpc.category_name`, + activity_name AS `aws.vpc.activity_name`, + disposition AS `aws.vpc.disposition`, + type_name AS `aws.vpc.type_name`, + + region AS `aws.vpc.region`, + accountid AS `aws.vpc.account-id` + FROM + datasourcename.gluedatabasename.vpclogstable +WITH ( + auto_refresh = true, + refresh_interval = '15 Minute', + checkpoint_location = 's3://accountnum-vpcflow/AWSLogs/checkpoint', + watermark_delay = '1 Minute' +) +``` ## Limitations -This feature is still under development, so there are some limitations.
For real-time updates, see the [developer documentation on GitHub](https://github.com/opensearch-project/opensearch-spark/blob/main/docs/index.md#limitations). diff --git a/_dashboards/management/acl.md b/_dashboards/management/acl.md new file mode 100644 index 0000000000..bd57b72419 --- /dev/null +++ b/_dashboards/management/acl.md @@ -0,0 +1,78 @@ +--- +layout: default +title: Access control lists for saved objects +parent: Dashboards Management +nav_order: 50 +--- + +# Access control lists for saved objects +Introduced 2.18 +{: .label .label-purple } + +You can use access control lists (ACLs) to manage permissions for your saved objects, providing authorization (AuthZ) capabilities without requiring backend plugin integration. + +## Understanding ACL types + +ACLs are applied at two levels: + +1. **Workspace ACL:** Workspace objects inherit permissions from their parent workspace. See [Workspace ACL]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace-acl) for more information. +2. **Objects ACL:** Each individual object can have its own ACL policy. All operations on these objects must pass ACL policy validation. + +## Enabling the ACL feature + +The ACL feature must be enabled before you can define any access controls. To enable it: + +1. Open your `opensearch_dashboards.yml` file. +2. Set `savedObjects.permission.enabled: true`. + +## Defining ACL permissions + +ACL permissions are defined using the following schema: + +```json +{ + "permissions": { + "<permission_type>": { + "users": ["<user_1>", "<user_2>"], + "groups": ["<group_1>", "<group_2>"] + } + } +} +``` +{% include copy.html %} + +### Granting permissions to authenticated users + +The wildcard character (`*`) grants permissions to all authenticated users, while named users and groups receive only the permissions explicitly assigned to them. In the following example, the ACL grants workspace management permissions to the `finance_manager` group and dashboard creation permissions to the `finance_analyst` group: + +```json +{ + "permissions": { + "write": { + "groups": ["finance_manager"] + }, + "library_write": { + "groups": ["finance_analyst"] + } + } +} +``` +{% include copy.html %} + +### Configuring mixed-level permissions + +To allow one user, `user-1` for example, to modify an object while giving read-only access to others, you can configure the ACL policy as follows: + +```json +{ + "permissions": { + "read": { + "users": ["*"] + }, + "write": { + "users": ["user-1"] + } + } +} +``` +{% include copy.html %} diff --git a/_dashboards/management/management-index.md b/_dashboards/management/management-index.md index 7edc4d06c2..01796180e5 100644 --- a/_dashboards/management/management-index.md +++ b/_dashboards/management/management-index.md @@ -9,16 +9,14 @@ has_children: true Introduced 2.10 {: .label .label-purple } -**Dashboards Management** serves as the command center for customizing OpenSearch Dashboards to your needs. A view of the interface is shown in the following image. +**Dashboards Management** is the central hub for managing and customizing OpenSearch data directly within OpenSearch Dashboards. -Dashboards Management interface - -{::nomarkdown}alert icon{:/} **Note**
OpenSearch and OpenSearch Dashboards privileges govern access to individual features. If you do not have the appropriate access, consult your administrator. -{: .note} +OpenSearch and OpenSearch Dashboards permissions govern access to individual features. If you do not have the appropriate access permissions, consult your administrator. +{: .warning} ## Applications -The following applications are available in **Dashboards Management**: +You can access the following applications in **Dashboards Management**: - **[Index Patterns]({{site.url}}{{site.baseurl}}/dashboards/management/index-patterns/):** To access OpenSearch data, you need to create an index pattern so that you can select the data you want to use and define the properties of the fields. The Index Pattern tool gives you the ability to create an index pattern from within the UI. Index patterns point to one or more indexes, data streams, or index aliases. - **[Data Sources]({{site.url}}{{site.baseurl}}/dashboards/management/multi-data-sources/):** The Data Sources tool is used to configure and manage the data sources that OpenSearch uses to collect and analyze data. You can use the tool to specify the source configuration in your copy of the [OpenSearch Dashboards configuration file](https://github.com/opensearch-project/OpenSearch-Dashboards/blob/main/config/opensearch_dashboards.yml). diff --git a/_dashboards/workspace/apis.md b/_dashboards/workspace/apis.md new file mode 100644 index 0000000000..683488e423 --- /dev/null +++ b/_dashboards/workspace/apis.md @@ -0,0 +1,386 @@ +--- +layout: default +title: Workspaces APIs +parent: Workspace for OpenSearch Dashboards +nav_order: 10 +--- + +# Workspaces APIs +Introduced 2.18 +{: .label .label-purple } + +The Workspaces API provides a set of endpoints for managing workspaces in OpenSearch Dashboards. + +## List Workspaces API + +You can use the following endpoint to retrieve a list of workspaces: + +```json +POST <host>:<port>/api/workspaces/_list +``` +{% include copy-curl.html %} + +The following table lists the available parameters. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `search` | String | Optional | A query string used to filter workspaces with simple query syntax, for example, `simple_query_string`. | +| `searchFields` | Array | Optional | Specifies which fields to perform the search query against. | +| `sortField` | String | Optional | The field name to use for sorting results. | +| `sortOrder` | String | Optional | Specifies ascending or descending sort order. | +| `perPage` | Number | Optional | The number of workspace results per page. | +| `page` | Number | Optional | The page number of the results to retrieve. | +| `permissionModes` | Array | Optional | A list of permissions to filter by. | + +#### Example request + +```json +POST /api/workspaces/_list +``` +{% include copy-curl.html %} + +The following example response shows a successful API call: + +```json +{ + "success": true, + "result": { + "page": 1, + "per_page": 20, + "total": 3, + "workspaces": [ + { + "name": "test1", + "features": [ + "use-case-all" + ], + "id": "hWNZls" + }, + { + "name": "test2", + "features": [ + "use-case-observability" + ], + "id": "SnkOPt" + } + ] + } +} +``` + +## Get Workspaces API + +You can use the following endpoint to retrieve a single workspace: + +```json +GET <host>:<port>/api/workspaces/<id> +``` +{% include copy-curl.html %} + +The following table lists the available path parameters.
All path parameters are required. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `<id>` | String | Required | Identifies the unique workspace to be retrieved. | + +#### Example request + +```json +GET /api/workspaces/SnkOPt +``` +{% include copy-curl.html %} + +The following example response shows a successful API call: + +```json +{ + "success": true, + "result": { + "name": "test2", + "features": ["use-case-all"], + "id": "SnkOPt" + } +} +``` + +## Create Workspaces API + +You can use the following endpoint to create a workspace: + +```json +POST <host>:<port>/api/workspaces +``` +{% include copy-curl.html %} + +The following table lists the available parameters. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `attributes` | Object | Required | Defines the workspace attributes. | +| `permissions` | Object | Optional | Specifies the permissions for the workspace. | + +#### Example request + +```json +POST api/workspaces +{ + "attributes": { + "name": "test4", + "description": "test4" + } +} +``` +{% include copy-curl.html %} + +The following example response shows a successful API call: + +```json +{ + "success": true, + "result": { + "id": "eHVoCJ" + } +} +``` + +## Update Workspaces API + +You can use the following endpoint to update the attributes and permissions for a workspace: + +```json +PUT <host>:<port>/api/workspaces/<id> +``` +{% include copy-curl.html %} + +The following table lists the available parameters. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `<id>` | String | Required | Identifies the unique workspace to be updated. | +| `attributes` | Object | Required | Defines the workspace attributes. | +| `permissions` | Object | Optional | Specifies the permissions for the workspace. | + +#### Example request + +```json +PUT api/workspaces/eHVoCJ +{ + "attributes": { + "name": "test4", + "description": "test update" + } +} +``` +{% include copy-curl.html %} + +The following example response shows a successful API call: + +```json +{ + "success": true, + "result": true +} +``` + +## Delete Workspaces API + +You can use the following endpoint to delete a workspace: + +```json +DELETE <host>:<port>/api/workspaces/<id> +``` +{% include copy-curl.html %} + +The following table lists the available path parameters. All path parameters are required. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `<id>` | String | Required | Identifies the unique workspace to be deleted. | + +#### Example request + +```json +DELETE api/workspaces/eHVoCJ +``` +{% include copy-curl.html %} + +The following example response shows a successful API call: + +```json +{ + "success": true, + "result": true +} +``` + +## Duplicate Saved Objects Workspaces API + +You can use the following endpoint to copy saved objects between workspaces: + +```json +POST <host>:<port>/api/workspaces/_duplicate_saved_objects +``` +{% include copy-curl.html %} + +The following table lists the available parameters. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `objects` | Array | Required | Specifies the saved objects to be duplicated. | +| `targetWorkspace` | String | Required | Identifies the destination workspace for copying. | +| `includeReferencesDeep` | Boolean | Optional | Determines whether to copy all referenced objects to the target workspace.
Default is `true`. | + +The following table lists the attributes of the object in the `objects` parameter. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `type` | String | Required | Defines the saved object classification, such as `index-pattern`, `config`, or `dashboard`. | +| `id` | String | Required | The ID of the saved object. | + +#### Example request + +```json +POST api/workspaces/_duplicate_saved_objects +{ + "objects": [ + { + "type": "index-pattern", + "id": "619cc200-ecd0-11ee-95b1-e7363f9e289d" + } + ], + "targetWorkspace": "9gt4lB" +} +``` +{% include copy-curl.html %} + +The following example response shows a successful API call: + +```json +{ + "successCount": 1, + "success": true, + "successResults": [ + { + "type": "index-pattern", + "id": "619cc200-ecd0-11ee-95b1-e7363f9e289d", + "meta": { + "title": "test*", + "icon": "indexPatternApp" + }, + "destinationId": "f4b724fd-9647-4bbf-bf59-610b43a62c75" + } + ] +} +``` + +## Associate Saved Objects Workspaces API + +You can use the following endpoint to associate saved objects with a workspace: + +```json +POST <host>:<port>/api/workspaces/_associate +``` +{% include copy-curl.html %} + +The following table lists the available parameters. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `workspaceId` | String | Required | Identifies the target workspace for object association. | +| `savedObjects` | Array | Required | Specifies the list of saved objects to be copied. | + +The following table lists the attributes of the object in the `objects` parameter. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `type` | String | Required | Defines the saved object classification, such as `index-pattern`, `config`, or `dashboard`. | +| `id` | String | Required | The ID of the saved object. | + +#### Example request + +```json +POST api/workspaces/_associate +{ + "objects": [ + { + "type": "index-pattern", + "id": "619cc200-ecd0-11ee-95b1-e7363f9e289d" + } + ], + "targetWorkspace": "9gt4lB" +} +``` +{% include copy-curl.html %} + +The following example response shows a successful API call: + +```json +{ + "success": true, + "result": [ + { + "id": "619cc200-ecd0-11ee-95b1-e7363f9e289d" + } + ] +} +``` + +## Dissociate Saved Objects Workspaces API + +You can use the following endpoint to dissociate saved objects from a workspace: + +```json +POST <host>:<port>/api/workspaces/_dissociate +``` +{% include copy-curl.html %} + +The following table lists the available parameters. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `workspaceId` | String | Required | The target workspace with which to associate the objects. | +| `savedObjects` | Array | Required | A list of saved objects to copy. | + +The following table lists the attributes of the `savedObjects` parameter. + +| Parameter | Data type | Required | Description | +| :--- | :--- | :--- | :--- | +| `type` | String | Required | The type of the saved object, such as `index-pattern`, `config`, or `dashboard`. | +| `id` | String | Required | The ID of the saved object.
| + +#### Example request + +```json +POST api/workspaces/_dissociate +{ + "objects": [ + { + "type": "index-pattern", + "id": "619cc200-ecd0-11ee-95b1-e7363f9e289d" + } + ], + "targetWorkspace": "9gt4lB" +} +``` +{% include copy-curl.html %} + +The following example response shows a successful API call: + +```json +{ + "success": true, + "result": [ + { + "id": "619cc200-ecd0-11ee-95b1-e7363f9e289d" + } + ] +} +``` diff --git a/_dashboards/workspace/create-workspace.md b/_dashboards/workspace/create-workspace.md new file mode 100644 index 0000000000..34ba65bb54 --- /dev/null +++ b/_dashboards/workspace/create-workspace.md @@ -0,0 +1,52 @@ +--- +layout: default +title: Create a workspace +parent: Workspace for OpenSearch Dashboards +nav_order: 1 +--- + +# Create a workspace +Introduced 2.18 +{: .label .label-purple } + +Before getting started with this tutorial, you must enable the workspace feature flag. See [Enabling the workspace feature]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace/#enabling-the-workspace-feature) for more information. + +When the saved objects permission is enabled, only users with admin status can create workspaces. See [Configuring the dashboard admin]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace-acl/#configuring-dashboard-administrators) for more information. + +To create a workspace, follow these steps: + +1. Open OpenSearch Dashboards. +2. From the main page, choose the appropriate card for your use case, for example, **Observability**, **Security Analytics**, **Search**, **Essentials**, or **Analytics**. Alternatively, you can select the **Create workspace** button and choose the appropriate use case from the dropdown menu. +3. Enter the required information in the **Workspace details** window. + - **Workspace name** is required. Valid characters are `a-z`, `A-Z`, `0-9`, parentheses (`()`), brackets (`[]`), underscore (`_`), hyphen (`-`), and spaces. Choose a unique workspace name within the character limit (40 characters). The **Create workspace** button is disabled when the workspace name already exists or exceeds the character limit, and an error message appears. + - **Use case and features** is required. Choose the use case that best fits your needs. If you are using Amazon OpenSearch Serverless and have enabled the [multiple data sources]({{site.url}}{{site.baseurl}}/dashboards/management/data-sources/) feature, **Essentials** is automatically assigned. +4. (Optional) Select the color picker to customize the color of your workspace icon. +5. (Optional) Add a workspace description of up to 200 characters. This option is disabled when the description exceeds the character limit. +6. Save your workspace. + - The **Create workspace** button becomes active once you enter the information for all required fields. You become the workspace owner automatically. The system redirects you to either the collaborators page if the saved objects permission is enabled or the overview page if the saved objects permission is disabled. See [Configuring dashboard admin]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace-acl/#configuring-dashboard-administrators) for more information about permissions. + +To set up permissions, see [Workspace access control lists]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace-acl/) for more information. + +## Associating data sources with a workspace + +The **Associate data source** option is only visible when the multiple data sources feature is enabled.
Before creating your workspace, you must connect it with at least one data source. If you have not set up your data sources, see [Data sources]({{site.url}}{{site.baseurl}}/dashboards/management/data-sources/). Once your sources are connected, you can link them to your new workspace. +{: .warning} + +### Associating OpenSearch data sources + +To associate OpenSearch data sources, follow these steps: + +1. Select the **Associate OpenSearch Data Sources** button to open the selection modal. +2. View the available data sources in the modal: + - Standard OpenSearch sources appear as single entries. + - Sources with direct query connections show a `+N` indicator. +3. Select the appropriate data source name(s). +4. Select the **Associate data sources** button to complete the association. + +### Associating direct query sources + +To associate direct query sources, follow these steps: + +1. Select the **Associate direct query data sources** button to open the selection modal. The modal displays only sources with direct query connections. +2. Select a data source to automatically expand its direct query connections. +3. Select the **Associate data sources** button to complete the association. diff --git a/_dashboards/workspace/index.md b/_dashboards/workspace/index.md new file mode 100644 index 0000000000..f0f572a4a5 --- /dev/null +++ b/_dashboards/workspace/index.md @@ -0,0 +1,27 @@ +--- +layout: default +title: Getting started with workspaces +parent: Workspace for OpenSearch Dashboards +nav_order: 0 +--- + +# Getting started with workspaces +Introduced 2.18 +{: .label .label-purple } + +OpenSearch Dashboards 2.18 introduces an enhanced home page that provides a comprehensive view of all your workspaces. + +The new home page includes the following features: + +1. A **Create workspace** button for [OpenSearch Dashboard admins]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace-acl/#configuring-dashboard-administrators) to navigate to the [create workspace]({{site.url}}{{site.baseurl}}/dashboards/workspace/create-workspace) page. +2. Workspace access time information and a link to the workspace overview page. +3. A use case information icon that displays information about the workspace's purpose. +4. A **View all workspaces** button that navigates to the [workspace management]({{site.url}}{{site.baseurl}}/dashboards/workspace/manage-workspace/#navigating-the-workspaces-list) page. +5. Links to the latest OpenSearch documentation through the **Learn more from documentation** button and to [OpenSearch Playground](https://playground.opensearch.org/app/home#/) through the **Explore live demo environment at playground.opensearch.org** button. + +The navigation logic ensures a seamless user experience by directing you to the appropriate page based on your workspace access level: + +- If you have a default workspace configured, you are directed to the workspace overview page. +- If you have only one workspace, you are directed to the overview page of that workspace. +- If you have multiple workspaces, you are directed to the new home page. +- If you have no workspaces, you are directed to the new home page.
diff --git a/_dashboards/workspace/manage-workspace.md b/_dashboards/workspace/manage-workspace.md
new file mode 100644
index 0000000000..45733d75be
--- /dev/null
+++ b/_dashboards/workspace/manage-workspace.md
@@ -0,0 +1,118 @@
+---
+layout: default
+title: Manage workspaces
+parent: Workspace for OpenSearch Dashboards
+nav_order: 2
+---
+
+# Manage workspaces
+Introduced 2.18
+{: .label .label-purple }
+
+You can access and modify workspace details, including the name, description, use case, and icon color, on the **Workspace details** page.
+
+To access and modify your workspace details, follow these steps:
+
+1. Open OpenSearch Dashboards and navigate to **My Workspaces**.
+2. Choose the desired workspace and then select the **Edit** button to make changes.
+3. Select the **Save** button to confirm changes or the **Discard changes** button to cancel modifications.
+
+## Workspace update permissions
+
+The following permissions apply when changing workspaces:
+
+1. **Without the Security plugin:** All users can edit and update the workspace.
+2. **With the Security plugin installed and `savedObjects.permission.enabled: false` in the `config/opensearch_dashboards.yml` file:** All users can edit and update workspaces.
+3. **With the Security plugin installed and `savedObjects.permission.enabled: true` in the `config/opensearch_dashboards.yml` file:** Only the [workspace owner]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace-acl/#defining-workspace-collaborators) and the [workspace admins]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace-acl/#configuring-dashboard-administrators) can edit and update workspaces.
+
+## Workspace update restrictions
+
+When updating workspace use cases, the following rules apply.
+
+Original use case | Target use case |
+:---: | :---:
+Analytics | Cannot be changed to any other use case
+Search | Analytics
+Security analytics | Analytics
+Observability | Analytics
+Essentials | Analytics <br> Search <br> Security analytics <br> Observability
+
+## Workspace control panel
+
+The **Workspace details** page features the following buttons in the upper-right corner:
+
+1. **Delete** (trash can icon)
+    - **Without the Security plugin installed:** All users can delete the workspace.
+    - **With the Security plugin installed and `savedObjects.permission.enabled: false` in the `config/opensearch_dashboards.yml` file:** All users can delete the workspace.
+    - **With the Security plugin installed and `savedObjects.permission.enabled: true` in the `config/opensearch_dashboards.yml` file:** Only the admin can delete the workspace.
+2. **Set as default workspace:** Sets the current workspace as the default login destination.
+3. **Workspace overview:** Opens the **Overview** page in a new tab.
+
+## Adding assets to the workspace
+
+Select **Sample data** in the left navigation menu, and then select the appropriate dataset to install it in your cluster and OpenSearch Dashboards.
+
+## Copying assets between workspaces
+
+Copying data sources and configurations is not supported.
+{: .warning}
+
+The assets page provides the following methods for copying assets across workspaces:
+
+1. **Copy all assets to...:** Copies all assets in the table.
+2. **Copy to...:** Copies the assets selected in the table.
+3. **Copy to...:** Copies a single asset from the table.
+
+After selecting a copy option, choose the target workspace from the dropdown menu. The **Copy related assets** checkbox allows you to transfer associated assets.
+
+Upon selecting the **Copy** button, a side panel appears showing successful and failed asset transfers. Asset copy destinations depend on the following security configurations:
+
+1. **Without the Security plugin:** All workspaces are accessible.
+2. **With the Security plugin and `savedObjects.permission.enabled: false` in the `config/opensearch_dashboards.yml` file:** All workspaces are accessible.
+3. **With the Security plugin and `savedObjects.permission.enabled: true` in the `config/opensearch_dashboards.yml` file:** Only workspaces for which the user has read and write or admin permissions are accessible.
+
+## Associating data sources
+
+On the data source management page, you can view a comprehensive list of associated OpenSearch connections, monitor direct query connections relevant to your current workspace, and establish new data source associations as needed.
+
+### Managing OpenSearch connections
+
+The OpenSearch connections tab displays all associated connections for the current workspace. Follow these steps to manage your connections:
+
+1. Access a comprehensive list of associated OpenSearch connections on the connections tab.
+2. Use the **Remove association** button to unlink connections as needed.
+3. Add new data sources by selecting the **OpenSearch data sources** button and using the modal that appears.
+4. Select from unassociated OpenSearch connections to expand your workspace's capabilities.
+
+### Adding direct query connections
+
+The **Direct query connections** tab displays a list of all direct query connections associated with your current workspace. To add more direct query connections to your workspace, select the **Direct query data sources** button. A modal window opens.
+
+The association modal displays a list of OpenSearch connections that contain direct query connections and have not yet been associated with your current workspace.
+When you associate an OpenSearch connection with your current workspace, all direct query connections within that OpenSearch connection are automatically associated as well.
+
+## Deleting your workspace
+
+Workspace deletion is restricted to admins. If you do not see a trash can icon, check your permissions. See [Configuring dashboard administrators]({{site.url}}{{site.baseurl}}/dashboards/workspace/workspace-acl/#configuring-dashboard-administrators) for more information.
+{: .warning}
+
+Deleting a workspace permanently erases all of its assets (except data sources) and the workspace itself. This action cannot be reversed.
+
+To delete a workspace, follow these steps:
+
+1. From the **Workspace details** page, select the trash can icon in the upper-right corner to delete the current workspace.
+2. Alternatively, from the workspace list page, select the ellipsis icon and select **Delete**. Optionally, select multiple workspaces for bulk deletion.
+
+## Navigating the workspaces list
+
+The workspaces list page serves as your central hub for workspace management, displaying all workspaces for which you have access permissions. Key features include the following:
+
+- **Search**: Quickly find a workspace by name.
+- **Filter**: Sort workspaces by use case.
+- **At a glance**: View each workspace's name, use case, description, last update time, and associated data sources.
+
+Each workspace entry includes an **Actions** column with the following buttons, which streamline workspace management and let you organize and customize your OpenSearch Dashboards environment efficiently:
+
+1. **Copy ID**: One-click copying of the workspace ID.
+2. **Edit**: Direct access to the workspace's detailed configuration page.
+3. **Set as default**: Set any workspace as your default workspace.
+4. **Delete**: Remove workspaces as needed (may require admin privileges).
diff --git a/_dashboards/workspace/workspace-acl.md b/_dashboards/workspace/workspace-acl.md
new file mode 100644
index 0000000000..16b2cc8628
--- /dev/null
+++ b/_dashboards/workspace/workspace-acl.md
@@ -0,0 +1,153 @@
+---
+layout: default
+title: Workspace access control lists
+parent: Workspace for OpenSearch Dashboards
+nav_order: 3
+---
+
+# Workspace access control lists
+Introduced 2.18
+{: .label .label-purple }
+
+Workspace access control lists (ACLs) manage authorization (AuthZ) for saved objects, while [Security in OpenSearch]({{site.url}}{{site.baseurl}}/security/) provides authentication (AuthN).
+
+## Personas
+
+**Workspace** use cases involve the following key personas:
+
+* **Dashboard admin:** Has full access to all OpenSearch Dashboards functions and data.
+* **Workspace administrator (also called _owner_):** Has full control over a specific workspace, including its configuration and saved objects. When a workspace is created, its creator is automatically assigned the role of workspace owner.
+* **Workspace content producer:** Can view, create, and update saved objects within the workspace.
+* **Workspace viewer:** Has read-only access to saved objects in the workspace.
+
+  Roles are workspace specific, allowing users to assume different roles across workspaces.
+  {: .note}
+
+## Enabling permission control
+
+See [Enabling the ACL feature]({{site.url}}{{site.baseurl}}/dashboards/management/acl#enabling-the-acl-feature) for instructions.
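+
+For quick reference, permission control is toggled by a single setting in `opensearch_dashboards.yml`; the full admin configuration in the next section shows it in context:
+
+```yaml
+savedObjects.permission.enabled: true
+```
+{% include copy.html %}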
+
+## Configuring dashboard administrators
+
+To grant full access to all workspaces and objects in OpenSearch Dashboards, configure the admin permissions. Edit the `opensearch_dashboards.yml` file to define the admin by user ID and backend role, as shown in the following configuration:
+
+```yaml
+opensearchDashboards.dashboardAdmin.users: ["UserID"]
+opensearchDashboards.dashboardAdmin.groups: ["BackendRole"]
+savedObjects.permission.enabled: true
+```
+{% include copy.html %}
+
+By default, the configuration is set to `[]`, meaning that no users are designated as admins. If the Security plugin is not installed and `savedObjects.permission.enabled: false` is set, all users are granted admin permissions.
+
+### Configuring global admin access
+
+Set all users as admins with the following wildcard setting:
+
+```yaml
+opensearchDashboards.dashboardAdmin.users: ["*"]
+```
+{% include copy.html %}
+
+### Configuring admin access for a single user
+
+Designate a single user as an admin by specifying that user's ID, as in the following example with `admin-user-id`:
+
+```yaml
+opensearchDashboards.dashboardAdmin.users: ["admin-user-id"]
+```
+{% include copy.html %}
+
+### Configuring admin access by backend role
+
+Grant admin access to all users with a specific backend role, as in the following example with `admin-role`:
+
+```yaml
+opensearchDashboards.dashboardAdmin.groups: ["admin-role"]
+```
+{% include copy.html %}
+
+### Admin-restricted operations
+
+Admin-restricted operations include the following:
+
+- Creating workspaces
+- Deleting workspaces
+- Connecting data sources to workspaces
+- Disconnecting data sources from workspaces
+
+## Defining workspace collaborators
+
+Access to collaborator management is limited to admins. The **Collaborators** feature is only available when permission control is enabled. For instructions on activating permission control, see [Enabling permission control](#enabling-permission-control). The access levels include the following:
+
+- **Read only:** Grants permission to view the workspace and its assets.
+- **Read and write:** Allows viewing and editing of assets within the workspace.
+- **Admin:** Provides full access, including viewing and editing of assets within the workspace and updating workspace metadata, such as name, description, data sources, and collaborators.
+
+From the **Collaborators** page, you can search by collaborator ID and filter results by collaborator type and access level.
+
+### Adding collaborators
+
+Workspace creators are granted the **Admin** access level as a collaborator. To add more collaborators, select the **Add collaborators** button, which displays a dropdown menu. Choose **Add Users** or **Add Groups** to access the corresponding modal for adding new collaborators.
+
+#### Adding users
+
+To add users, follow these steps:
+
+1. Select the **Add Users** button to open the modal. The modal displays one empty `User ID` field by default.
+2. Choose an access level: **Read only**, **Read and write**, or **Admin**.
+3. Choose **Add another User** to add multiple users. To avoid errors, do not enter duplicate or already existing user IDs.
+4. Resolve any errors before finalizing. Successfully added users appear in the collaborators table.
+
+#### Adding groups
+
+To add groups, follow these steps:
+
+1. Select the **Add Groups** button to open the modal. The modal displays one empty `Group ID` field by default.
+2. Choose an access level: **Read only**, **Read and write**, or **Admin**.
+3. Use **Add another group** to add multiple groups. To avoid errors, do not enter duplicate or already existing group IDs.
+4. Resolve any errors before finalizing. Successfully added groups appear in the collaborators table.
+
+### Modifying access levels
+
+You can modify collaborators' access levels after adding them to the collaborators table if you have the required permissions. Collaborators can be assigned any access level. However, if all **Admin** collaborators are changed to lower access levels, then only dashboard admins can manage workspace collaboration.
+
+#### Modifying individual access levels
+
+To modify a single collaborator's access level, follow these steps:
+
+1. Select the action icon on the right of the table row.
+2. Select **Change access level** from the dropdown menu.
+3. Choose the desired access level from the list.
+4. Confirm the change in the modal that appears and select **Confirm**. The collaborator's access level is updated in the table upon confirmation.
+
+#### Modifying access levels in batch
+
+To change access levels for several collaborators simultaneously, follow these steps:
+
+1. Select the desired collaborator rows in the table.
+2. Select the **Actions** button that appears.
+3. Select **Change access level** from the dropdown menu.
+4. Select the new access level from the list provided.
+5. Review and confirm the changes in the modal that appears. The access levels of all selected collaborators are updated in the table upon confirmation.
+
+### Deleting collaborators
+
+After adding collaborators to the table, you have the option to delete them. Be cautious when removing admin collaborators because deleting all of them restricts workspace collaborator management to dashboard admins only. A confirmation modal is displayed before this action is finalized.
+
+#### Deleting individual collaborators
+
+To delete an individual collaborator, follow these steps:
+
+1. Select the ellipsis icon on the right of the table row to display a dropdown menu.
+2. Select **Delete collaborator** from the dropdown menu. A confirmation modal appears to verify your action.
+3. Select **Confirm** in the modal to remove the collaborator from the table.
+
+#### Deleting collaborators in batch
+
+To remove several collaborators simultaneously, follow these steps:
+
+1. Select the rows containing the collaborators you want to remove from the table. A **Delete x collaborators** button appears.
+2. Select the **Delete x collaborators** button.
+3. Review the confirmation modal that appears.
+4. Select **Confirm** to remove all selected collaborators from the table.
diff --git a/_dashboards/workspace/workspace.md b/_dashboards/workspace/workspace.md
new file mode 100644
index 0000000000..0938c48891
--- /dev/null
+++ b/_dashboards/workspace/workspace.md
@@ -0,0 +1,118 @@
+---
+layout: default
+title: Workspace for OpenSearch Dashboards
+nav_order: 110
+has_children: true
+---
+
+# Workspace for OpenSearch Dashboards
+Introduced 2.18
+{: .label .label-purple }
+
+The Workspace feature in OpenSearch Dashboards enables you to tailor your environment with use-case-specific configurations. For example, you can create dedicated workspaces for observability scenarios, allowing you to focus on relevant functionalities. Additionally, the Workspace feature enables you to organize visual assets, such as dashboards and visualizations, within a workspace with isolated storage.
+
+## Workspace data model
+
+The Workspace data model is defined by the following structure:
+
+```typescript
+interface Workspace {
+  id: string;
+  name: string;
+  description?: string;
+  features?: string[];
+  color: string;
+  uiSettings: Record<string, unknown>;
+}
+```
+{% include copy.html %}
+
+The Workspace data model is composed of the following key attributes:
+
+- `id`: String type; unique ID for each workspace.
+- `name`: String type; designates the name of the workspace.
+- `description`: Optional string type; provides contextual information for the workspace.
+- `features`: Optional array of strings; contains use case IDs linked to the workspace.
+- `color`: String type; specifies the color of the workspace icon.
+- `uiSettings`: Key-value map; holds the UI settings scoped to the workspace.
+
+---
+
+#### Example Workspace object
+
+The following object shows a typical Workspace configuration:
+
+```typescript
+{
+  id: "M5NqCu",
+  name: "Analytics team",
+  description: "Analytics team workspace",
+  features: ["use-case-analytics"],
+}
+```
+{% include copy.html %}
+
+This configuration creates the `Analytics team` workspace using the `use-case-analytics` feature set. Use cases map to specific feature groups, limiting functionality to the defined set within each workspace.
+
+The following are predefined use case options:
+
+- `use-case-observability`
+- `use-case-security-analytics`
+- `use-case-search`
+- `use-case-essentials`
+- `use-case-all`
+
+---
+
+## Associating saved objects with workspaces
+
+Saved objects in OpenSearch Dashboards, such as dashboards, visualizations, and index patterns, can be associated with specific workspaces, improving organization and accessibility as the volume of objects grows.
+
+To link a saved object with one or more workspaces, a `workspaces` attribute (an array of strings) is added to the object. As a result, saved objects such as dashboards and visualizations are only accessible within their designated workspaces.
+
+The following example shows a dashboard object associated with the workspace `M5NqCu`:
+
+```typescript
+{
+  type: "dashboard",
+  id: "da123f20-6680-11ee-93fa-df944ec23359",
+  workspaces: ["M5NqCu"]
+}
+```
+{% include copy.html %}
+
+Saved objects support association with multiple workspaces, facilitating cross-team collaboration and resource sharing. This feature is useful when an object is relevant to multiple teams, projects, or use cases.
+
+The following example shows a data source object linked to multiple workspaces:
+
+```typescript
+{
+  type: "data-source",
+  id: "da123f20-6680-11ee-93fa-df944ec23359",
+  workspaces: ["M5NqCu", "<workspace-id-1>", "<workspace-id-2>"]
+}
+```
+{% include copy.html %}
+
+## Non-workspace saved objects
+
+Not all saved objects in OpenSearch Dashboards are associated with a workspace. Some objects operate independently of the workspace framework. These objects lack the `workspaces` attribute and serve system-wide functions. For example, the global user interface settings object manages configurations affecting the entire OpenSearch Dashboards interface, maintaining consistent functionality across all workspaces.
+
+This dual approach allows OpenSearch Dashboards to balance granular, context-specific customization with overall system consistency.
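+
+The following minimal TypeScript sketch illustrates this visibility rule. It is not part of the OpenSearch Dashboards API; the `SavedObject` shape and the `isVisibleInWorkspace` helper are illustrative assumptions distilled from the data model described on this page:
+
+```typescript
+interface SavedObject {
+  type: string;
+  id: string;
+  workspaces?: string[]; // absent for non-workspace (system-wide) objects
+}
+
+// A saved object is visible in a workspace if it lists that workspace's ID;
+// objects without a `workspaces` attribute are treated as global.
+function isVisibleInWorkspace(obj: SavedObject, workspaceId: string): boolean {
+  return obj.workspaces === undefined || obj.workspaces.includes(workspaceId);
+}
+
+const dashboard: SavedObject = {
+  type: "dashboard",
+  id: "da123f20-6680-11ee-93fa-df944ec23359",
+  workspaces: ["M5NqCu"],
+};
+
+console.log(isVisibleInWorkspace(dashboard, "M5NqCu")); // true
+console.log(isVisibleInWorkspace(dashboard, "9gt4lB")); // false
+```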
+
+## Enabling the Workspace feature
+
+In your `opensearch_dashboards.yml` file, set the following options:
+
+```yaml
+workspace.enabled: true
+uiSettings:
+  overrides:
+    "home:useNewHomePage": true
+```
+{% include copy.html %}
+
+If your cluster has the Security plugin installed, then multi-tenancy must be disabled to avoid conflicts with the workspace feature:
+
+```yaml
+opensearch_security.multitenancy.enabled: false
+```
+{% include copy.html %}
diff --git a/_data-prepper/pipelines/configuration/processors/anomaly-detector.md b/_data-prepper/pipelines/configuration/processors/anomaly-detector.md
index 9628bb6caf..ba574bdf7d 100644
--- a/_data-prepper/pipelines/configuration/processors/anomaly-detector.md
+++ b/_data-prepper/pipelines/configuration/processors/anomaly-detector.md
@@ -53,6 +53,7 @@ You can configure `random_cut_forest` mode with the following options.
 | `sample_size` | `256` | 100--2500 | The sample size used in the ML algorithm. |
 | `time_decay` | `0.1` | 0--1.0 | The time decay value used in the ML algorithm. Used as the mathematical expression `timeDecay` divided by `SampleSize` in the ML algorithm. |
 | `type` | `metrics` | N/A | The type of data sent to the algorithm. |
+| `output_after` | `32` | N/A | The number of events to process before outputting any detected anomalies. |
 | `version` | `1.0` | N/A | The algorithm version number. |
 
 ## Usage
diff --git a/_data-prepper/pipelines/configuration/processors/aws-lambda.md b/_data-prepper/pipelines/configuration/processors/aws-lambda.md
new file mode 100644
index 0000000000..bd167996a1
--- /dev/null
+++ b/_data-prepper/pipelines/configuration/processors/aws-lambda.md
@@ -0,0 +1,94 @@
+---
+layout: default
+title: aws_lambda
+parent: Processors
+grand_parent: Pipelines
+nav_order: 10
+---
+
+# aws_lambda integration for Data Prepper
+
+The [AWS Lambda](https://aws.amazon.com/lambda/) integration allows developers to use serverless computing capabilities within their Data Prepper pipelines for flexible event processing and data routing.
+
+## AWS Lambda processor configuration
+
+The `aws_lambda` processor enables you to invoke an AWS Lambda function within your Data Prepper pipeline to process events. It supports both synchronous and asynchronous invocations based on your use case.
+
+## Configuration fields
+
+You can configure the processor using the following configuration options.
+
+Field | Type | Required | Description
+-------------------- | ------- | -------- | ----------------------------------------------------------------------------
+`function_name` | String | Required | The name of the AWS Lambda function to invoke.
+`invocation_type` | String | Optional | Specifies the invocation type, either `request-response` or `event`. Default is `request-response`.
+`aws.region` | String | Required | The AWS Region in which the Lambda function is located.
+`aws.sts_role_arn` | String | Optional | The Amazon Resource Name (ARN) of the role to assume before invoking the Lambda function.
+`max_retries` | Integer | Optional | The maximum number of retries for failed invocations. Default is `3`.
+`batch` | Object | Optional | The batch settings for the Lambda invocations. Default is `key_name = "events"`. Default threshold is `event_count=100`, `maximum_size="5mb"`, and `event_collect_timeout = 10s`.
+`lambda_when` | String | Optional | A conditional expression that determines when to invoke the Lambda processor.
+`response_codec` | Object | Optional | A codec configuration for parsing Lambda responses. Default is `json`.
+`tags_on_match_failure` | List | Optional | A list of tags to add to events when Lambda matching fails or encounters an unexpected error.
+`sdk_timeout` | Duration | Optional | Configures the SDK's client connection timeout period. Default is `60s`.
+`response_events_match` | Boolean | Optional | Specifies how Data Prepper interprets and processes Lambda function responses. Default is `false`.
+
+#### Example configuration
+
+```yaml
+processors:
+  - aws_lambda:
+      function_name: "my-lambda-function"
+      invocation_type: "request-response"
+      response_events_match: false
+      aws:
+        region: "us-east-1"
+        sts_role_arn: "arn:aws:iam::123456789012:role/my-lambda-role"
+      max_retries: 3
+      batch:
+        key_name: "events"
+        threshold:
+          event_count: 100
+          maximum_size: "5mb"
+          event_collect_timeout: PT10S
+      lambda_when: "event['status'] == 'process'"
+```
+{% include copy.html %}
+
+## Usage
+
+The processor supports the following invocation types and related options:
+
+- `request-response`: The processor waits for Lambda function completion before proceeding.
+- `event`: The function is triggered asynchronously without waiting for a response.
+- `batch`: When enabled, events are aggregated and sent in bulk to optimize Lambda invocations. Batch thresholds control the event count, size limit, and timeout.
+- `codec`: JSON is used for both request and response codecs. Lambda must return JSON array outputs.
+- `tags_on_match_failure`: Custom tags can be applied to events when Lambda processing fails or encounters unexpected issues.
+
+## Behavior
+
+When configured for batching, the AWS Lambda processor groups multiple events into a single request. This grouping is governed by batch thresholds, which can be based on the event count, size limit, or timeout. The processor then sends the entire batch to the Lambda function as a single payload.
+
+## Lambda response handling
+
+The `response_events_match` setting defines how Data Prepper handles the relationship between batch events sent to Lambda and the response received:
+
+- `true`: Lambda returns a JSON array containing one result for each batched event. Data Prepper maps each element of the array back to its corresponding original event, so the Lambda function is expected to return the same number of response events as original requests, in the original order.
+- `false`: Lambda returns one or more events for the entire batch. Response events are not correlated with the original events, and original event metadata is not preserved in the response events.
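+
+As an illustration, the following hedged sketch shows what a batched request and a matching response might look like when `response_events_match` is set to `true`. The payload shape follows the `key_name: "events"` batch setting from the example configuration; the field values are hypothetical:
+
+```json
+{
+  "events": [
+    { "status": "process", "message": "first event" },
+    { "status": "process", "message": "second event" }
+  ]
+}
+```
+
+A conforming Lambda function would return a JSON array with one element per input event, in the same order:
+
+```json
+[
+  { "status": "process", "message": "first event", "enriched": true },
+  { "status": "process", "message": "second event", "enriched": true }
+]
+```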
+
+## Limitations
+
+Note the following limitations:
+
+- Payload limitation: 6 MB payload limit
+- Response codec: JSON-only codec support
+
+## Integration testing
+
+Integration tests for this plugin are executed separately from the main Data Prepper build process. Use the following Gradle command to run these tests:
+
+```
+./gradlew :data-prepper-plugins:aws-lambda:integrationTest -Dtests.processor.lambda.region="us-east-1" -Dtests.processor.lambda.functionName="lambda_test_function" -Dtests.processor.lambda.sts_role_arn="arn:aws:iam::123456789012:role/dataprepper-role"
+```
+{% include copy.html %}
diff --git a/_data-prepper/pipelines/configuration/sinks/aws-lambda.md b/_data-prepper/pipelines/configuration/sinks/aws-lambda.md
new file mode 100644
index 0000000000..d8c00bdb16
--- /dev/null
+++ b/_data-prepper/pipelines/configuration/sinks/aws-lambda.md
@@ -0,0 +1,73 @@
+---
+layout: default
+title: aws_lambda
+parent: Sinks
+grand_parent: Pipelines
+nav_order: 10
+---
+
+# `aws_lambda` sink for Data Prepper
+
+This page explains how to configure and use [AWS Lambda](https://aws.amazon.com/lambda/) with Data Prepper, enabling Lambda functions to serve as both processors and sinks.
+
+## `aws_lambda` sink
+
+Configure the Lambda sink using the following parameters.
+
+Field | Type | Required | Description
+--------------------| ------- | -------- | ----------------------------------------------------------------------------
+`function_name` | String | Yes | The name of the AWS Lambda function to invoke.
+`invocation_type` | String | No | Specifies the invocation type. Default is `event`.
+`aws.region` | String | Yes | The AWS Region in which the Lambda function is located.
+`aws.sts_role_arn` | String | No | The Amazon Resource Name (ARN) of the role to assume before invoking the Lambda function.
+`max_retries` | Integer | No | The maximum number of retries if the invocation fails. Default is `3`.
+`batch` | Object | No | Optional batch settings for Lambda invocations. Default is `key_name = events`. Default threshold is `event_count=100`, `maximum_size="5mb"`, and `event_collect_timeout = 10s`.
+`lambda_when` | String | No | A conditional expression that determines when to invoke the Lambda sink.
+`dlq` | Object | No | The dead-letter queue (DLQ) configuration for failed invocations.
+
+#### Example configuration
+
+```yaml
+sink:
+  - aws_lambda:
+      function_name: "my-lambda-sink"
+      invocation_type: "event"
+      aws:
+        region: "us-west-2"
+        sts_role_arn: "arn:aws:iam::123456789012:role/my-lambda-sink-role"
+      max_retries: 5
+      batch:
+        key_name: "events"
+        threshold:
+          event_count: 50
+          maximum_size: "3mb"
+          event_collect_timeout: PT5S
+      lambda_when: "event['type'] == 'log'"
+      dlq:
+        region: "us-east-1"
+        sts_role_arn: "arn:aws:iam::123456789012:role/my-sqs-role"
+        bucket: "<bucket-name>"
+```
+{% include copy.html %}
+
+## Usage
+
+The invocation types and related options are as follows:
+
+- `event` (default): Executes functions asynchronously without waiting for responses.
+- `request-response` (sink only): Executes functions synchronously, though responses are not processed.
+- `batch`: Automatically groups events based on configured thresholds.
+- `dlq`: Supports the DLQ configuration for failed invocations after retry attempts.
+
+Data Prepper assumes the AWS Identity and Access Management (IAM) role specified in `aws.sts_role_arn` to invoke the Lambda function securely and respects Lambda's concurrency limits during event processing. For more information, see the [AWS Lambda documentation](https://docs.aws.amazon.com/lambda).
+{: .note}
+
+## Developer guide
+
+Integration tests must be executed separately from the main Data Prepper build.
+Execute them with the following command:
+
+```
+./gradlew :data-prepper-plugins:aws-lambda:integrationTest -Dtests.sink.lambda.region="us-east-1" -Dtests.sink.lambda.functionName="lambda_test_function" -Dtests.sink.lambda.sts_role_arn="arn:aws:iam::123456789012:role/dataprepper-role"
+```
+{% include copy.html %}
diff --git a/_data-prepper/pipelines/configuration/sources/s3.md b/_data-prepper/pipelines/configuration/sources/s3.md
index db92718a36..7ca27ee500 100644
--- a/_data-prepper/pipelines/configuration/sources/s3.md
+++ b/_data-prepper/pipelines/configuration/sources/s3.md
@@ -104,7 +104,7 @@ Option | Required | Type | Description
 `s3_select` | No | [s3_select](#s3_select) | The Amazon S3 Select configuration.
 `scan` | No | [scan](#scan) | The S3 scan configuration.
 `delete_s3_objects_on_read` | No | Boolean | When `true`, the S3 scan attempts to delete S3 objects after all events from the S3 object are successfully acknowledged by all sinks. `acknowledgments` should be enabled when deleting S3 objects. Default is `false`.
-`workers` | No | Integer | Configures the number of worker threads that the source uses to read data from S3. Leave this value as the default unless your S3 objects are less than 1 MB in size. Performance may decrease for larger S3 objects. This setting affects SQS-based sources and S3-Scan sources. Default is `1`.
+`workers` | No | Integer | Configures the number of worker threads (1--10) that the source uses to read data from S3. Leave this value as the default unless your S3 objects are less than 1 MB in size. Performance may decrease for larger S3 objects. This setting affects SQS-based sources and S3-Scan sources. Default is `1`.
diff --git a/_data-prepper/pipelines/expression-syntax.md b/_data-prepper/pipelines/expression-syntax.md
index 383b54c19b..07f68ee58e 100644
--- a/_data-prepper/pipelines/expression-syntax.md
+++ b/_data-prepper/pipelines/expression-syntax.md
@@ -30,6 +30,9 @@ The following table lists the supported operators. Operators are listed in order
 |----------------------|-------------------------------------------------------|---------------|
 | `()` | Priority expression | Left to right |
 | `not`<br>`+`<br>`-` | Unary logical NOT<br>Unary positive<br>Unary negative | Right to left |
+| `*`, `/` | Multiplication and division operators | Left to right |
+| `+`, `-` | Addition and subtraction operators | Left to right |
+| `+` | String concatenation operator | Left to right |
 | `<`, `<=`, `>`, `>=` | Relational operators | Left to right |
 | `==`, `!=` | Equality operators | Left to right |
 | `and`, `or` | Conditional expression | Left to right |
@@ -78,7 +81,6 @@ Conditional expressions allow you to combine multiple expressions or values usin
 <expression> and <expression>
 <expression> or <expression>
 not <expression>
 ```
-{% include copy-curl.html %}
 
 The following are some example conditional expressions:
@@ -91,9 +93,64 @@ not /status_code in {200, 202}
 ```
 {% include copy-curl.html %}
 
+### Arithmetic expressions
+
+Arithmetic expressions enable basic mathematical operations, such as addition, subtraction, multiplication, and division. These expressions can be combined with conditional expressions to create more complex conditional statements. The available arithmetic operators are `+`, `-`, `*`, and `/`. The syntax for using the arithmetic operators is as follows:
+
+```
+<operand> + <operand>
+<operand> - <operand>
+<operand> * <operand>
+<operand> / <operand>
+```
+
+The following are example arithmetic expressions:
+
+```
+/value + length(/message)
+/bytes / 1024
+/value1 - /value2
+/TimeInSeconds * 1000
+```
+{% include copy-curl.html %}
+
+The following are some example arithmetic expressions used in conditional expressions:
+
+```
+/value + length(/message) > 200
+/bytes / 1024 < 10
+/value1 - /value2 != /value3 + /value4
+```
+{% include copy-curl.html %}
+
+### String concatenation expressions
+
+String concatenation expressions enable you to combine strings to create new strings. These concatenated strings can also be used within conditional expressions. The syntax for using string concatenation is as follows:
+
+```
+<string> + <string>
+```
+
+The following are example string concatenation expressions:
+
+```
+/name + "suffix"
+"prefix" + /name
+"time of " + /timeInMs + " ms"
+```
+{% include copy-curl.html %}
+
+The following are example string concatenation expressions that can be used in conditional expressions:
+
+```
+/service + ".com" == /url
+"www." + /service != /url
+```
+{% include copy-curl.html %}
+
 ### Reserved symbols
 
-Reserved symbols are symbols that are not currently used in the expression syntax but are reserved for possible future functionality or extensions. Reserved symbols include `^`, `*`, `/`, `%`, `+`, `-`, `xor`, `=`, `+=`, `-=`, `*=`, `/=`, `%=`, `++`, `--`, and `${}`.
+Certain symbols are reserved for possible future functionality or extensions: `^`, `%`, `xor`, `=`, `+=`, `-=`, `*=`, `/=`, `%=`, `++`, `--`, and `${}`.
 
 ## Syntax components
 
@@ -170,6 +227,9 @@ White space is optional around relational operators, regex equality operators, e
 | `()` | Priority expression | Yes | `/a==(/b==200)`<br>`/a in ({200})` | `/status in({200})` |
 | `in`, `not in` | Set operators | Yes | `/a in {200}`<br>`/a not in {400}` | `/a in{200, 202}`<br>`/a not in{400}` |
 | `<`, `<=`, `>`, `>=` | Relational operators | No | `/status < 300`<br>`/status>=300` | |
+| `+` | String concatenation operator | No | `/status_code + /message + "suffix"` | |
+| `+`, `-` | Arithmetic addition and subtraction operators | No | `/status_code + length(/message) - 2` | |
+| `*`, `/` | Multiplication and division operators | No | `/status_code * length(/message) / 3` | |
 | `=~`, `!~` | Regex equality operators | No | `/msg =~ "^\w*$"`<br>`/msg=~"^\w*$"` | |
 | `==`, `!=` | Equality operators | No | `/status == 200`<br>`/status_code==200` | |
 | `and`, `or`, `not` | Conditional operators | Yes | `/a<300 and /b>200` | `/b<300and/b>200` |
diff --git a/_data/top_nav.yml b/_data/top_nav.yml
index 51d8138680..6552d90359 100644
--- a/_data/top_nav.yml
+++ b/_data/top_nav.yml
@@ -63,6 +63,8 @@ items:
       url: /docs/latest/clients/
     - label: Benchmark
      url: /docs/latest/benchmark/
+    - label: Migration Assistant
+      url: /docs/latest/migration-assistant/
   - label: Platform
     url: /platform/index.html
     children:
diff --git a/_field-types/supported-field-types/flat-object.md b/_field-types/supported-field-types/flat-object.md
index c9e59710e1..65d7c6dc8e 100644
--- a/_field-types/supported-field-types/flat-object.md
+++ b/_field-types/supported-field-types/flat-object.md
@@ -56,7 +56,8 @@ The flat object field type supports the following queries:
 - [Multi-match]({{site.url}}{{site.baseurl}}/query-dsl/full-text/multi-match/)
 - [Query string]({{site.url}}{{site.baseurl}}/query-dsl/full-text/query-string/)
 - [Simple query string]({{site.url}}{{site.baseurl}}/query-dsl/full-text/simple-query-string/)
-- [Exists]({{site.url}}{{site.baseurl}}/query-dsl/term/exists/)
+- [Exists]({{site.url}}{{site.baseurl}}/query-dsl/term/exists/)
+- [Wildcard]({{site.url}}{{site.baseurl}}/query-dsl/term/wildcard/)
 
 ## Limitations
 
@@ -243,4 +244,4 @@ PUT /test-index/
 ```
 {% include copy-curl.html %}
 
-Because `issue.number` is not part of the flat object, you can use it to aggregate and sort documents.
\ No newline at end of file
+Because `issue.number` is not part of the flat object, you can use it to aggregate and sort documents.
diff --git a/_getting-started/communicate.md b/_getting-started/communicate.md
index 3472270c30..773558fb21 100644
--- a/_getting-started/communicate.md
+++ b/_getting-started/communicate.md
@@ -28,7 +28,7 @@ curl -X GET "http://localhost:9200/_cluster/health"
 If you're using the Security plugin, provide the username and password in the request:
 
 ```bash
-curl -X GET "http://localhost:9200/_cluster/health" -ku admin:<custom-admin-password>
+curl -X GET "https://localhost:9200/_cluster/health" -ku admin:<custom-admin-password>
 ```
 {% include copy.html %}
 
@@ -317,4 +317,4 @@ Once a field is created, you cannot change its type. Changing a field type requi
 
 ## Next steps
 
-- See [Ingest data into OpenSearch]({{site.url}}{{site.baseurl}}/getting-started/ingest-data/) to learn about ingestion options.
\ No newline at end of file
+- See [Ingest data into OpenSearch]({{site.url}}{{site.baseurl}}/getting-started/ingest-data/) to learn about ingestion options.
diff --git a/_includes/cards.html b/_includes/cards.html
index 6d958e61a5..5ab37b8c27 100644
--- a/_includes/cards.html
+++ b/_includes/cards.html
@@ -30,8 +30,14 @@
         Measure performance metrics for your OpenSearch cluster
+
+        Migration Assistant
+
+        Migrate to OpenSearch from other platforms
+
diff --git a/_includes/header.html b/_includes/header.html
index 20d82c451e..32d5b14774 100644
--- a/_includes/header.html
+++ b/_includes/header.html
@@ -82,7 +82,7 @@ {% endif %}