Name: Elasticsearch 8.x Expert
Author: chrishuffman5

搵技能.../

# First node startup output includes:
# - elastic user password
# - Enrollment token for Kibana
# - Enrollment token for other nodes

# Enroll a new node
bin/elasticsearch --enrollment-token <token>

# Enroll Kibana
bin/kibana --enrollment-token <token>

# Reset elastic password
bin/elasticsearch-reset-password -u elastic

# Generate enrollment token for additional nodes
bin/elasticsearch-create-enrollment-token -s node

# Generate enrollment token for Kibana
bin/elasticsearch-create-enrollment-token -s kibana

PUT /semantic-search
{
  "mappings": {
    "properties": {
      "title": { "type": "text" },
      "title_embedding": {
        "type": "dense_vector",
        "dims": 384,
        "index": true,
        "similarity": "cosine"
      }
    }
  }
}

POST /semantic-search/_doc/1
{
  "title": "Introduction to Elasticsearch",
  "title_embedding": [0.12, -0.34, 0.56, ...]
}

POST /semantic-search/_search
{
  "knn": {
    "field": "title_embedding",
    "query_vector": [0.11, -0.32, 0.55, ...],
    "k": 10,
    "num_candidates": 100
  },
  "_source": ["title"]
}

POST /semantic-search/_search
{
  "query": {
    "match": { "title": "elasticsearch guide" }
  },
  "knn": {
    "field": "title_embedding",
    "query_vector": [0.11, -0.32, 0.55, ...],
    "k": 10,
    "num_candidates": 100,
    "boost": 0.5
  },
  "size": 10
}

POST /semantic-search/_search
{
  "knn": {
    "field": "title_embedding",
    "query_vector": [0.11, -0.32, 0.55, ...],
    "k": 10,
    "num_candidates": 100,
    "filter": {
      "term": { "category": "technology" }
    }
  }
}

Version	Enhancement
8.0	Initial kNN search support with HNSW
8.4	Filtered kNN, hybrid search (kNN + query), kNN in bool query
8.6	Quantization support for reduced memory footprint
8.8	Nested kNN search, improved performance
8.10	Byte-quantized vectors (int8), reduced memory by ~4x
8.12	Better quantization, scalar quantization built-in
8.14	BBQ (Better Binary Quantization) for ~32x memory reduction
8.15	Improved HNSW graph building, bit vectors

{
  "type": "dense_vector",
  "dims": 768,
  "index": true,
  "similarity": "cosine",
  "index_options": {
    "type": "hnsw",
    "m": 16,
    "ef_construction": 100
  }
}

# Start the trained model deployment. The endpoint is POST, and the sizing
# options are passed as query parameters so the request works on every 8.x release.
POST _ml/trained_models/sentence-transformers__all-minilm-l6-v2/deployment/_start?number_of_allocations=1&threads_per_allocation=2&queue_capacity=1024

PUT _ingest/pipeline/text-embedding
{
  "processors": [
    {
      "inference": {
        "model_id": "sentence-transformers__all-minilm-l6-v2",
        "input_output": [
          {
            "input_field": "text",
            "output_field": "text_embedding"
          }
        ]
      }
    }
  ]
}

POST /my-index/_search
{
  "knn": {
    "field": "text_embedding",
    "query_vector_builder": {
      "text_embedding": {
        "model_id": "sentence-transformers__all-minilm-l6-v2",
        "model_text": "What is Elasticsearch?"
      }
    },
    "k": 10,
    "num_candidates": 100
  }
}

PUT /my-index
{
  "mappings": {
    "properties": {
      "content_embedding": {
        "type": "sparse_vector"
      }
    }
  }
}

POST /my-index/_search
{
  "query": {
    "sparse_vector": {
      "field": "content_embedding",
      "inference_id": "elser_model",
      "query": "What is Elasticsearch?"
    }
  }
}

PUT _index_template/metrics-template
{
  "index_patterns": ["metrics-*"],
  "template": {
    "settings": {
      "index.mode": "time_series",
      "index.routing_path": ["host.name", "metric.name"],
      "index.time_series.start_time": "2024-01-01T00:00:00Z",
      "index.time_series.end_time": "2024-12-31T23:59:59Z"
    },
    "mappings": {
      "properties": {
        "@timestamp": { "type": "date" },
        "host.name": { "type": "keyword", "time_series_dimension": true },
        "metric.name": { "type": "keyword", "time_series_dimension": true },
        "metric.value": { "type": "double", "time_series_metric": "gauge" }
      }
    }
  }
}

POST _snapshot/my-repo/snapshot-1/_mount?storage=shared_cache
{
  "index": "old-logs-2023",
  "renamed_index": "searchable-old-logs-2023"
}

Type	Data Location	Performance	Use Case
`full_copy`	Full copy on local node	Fast (same as normal)	Warm tier (frequent access)
`shared_cache`	Object storage + local cache	Slower (cache misses = S3 reads)	Frozen tier (infrequent access)

# elasticsearch.yml (frozen data node)
node.roles: [data_frozen]
xpack.searchable.snapshot.shared_cache.size: 90%

POST _security/api_key
{
  "name": "search-service",
  "role_descriptors": {
    "search": {
      "indices": [
        {
          "names": ["products*"],
          "privileges": ["read"]
        }
      ]
    }
  },
  "expiration": "30d",
  "metadata": {
    "application": "search-service",
    "environment": "production"
  }
}

PUT _security/api_key/api-key-id
{
  "role_descriptors": {
    "search": {
      "indices": [
        {
          "names": ["products*", "catalog*"],
          "privileges": ["read"]
        }
      ]
    }
  },
  "metadata": {
    "updated_at": "2024-01-15"
  }
}

POST _security/cross_cluster/api_key
{
  "name": "cross-cluster-key",
  "access": {
    "search": [
      { "names": ["logs-*"] }
    ],
    "replication": [
      { "names": ["critical-data"] }
    ]
  }
}

POST _query
{
  "query": """
    FROM logs-*
    | WHERE log.level == "error" AND @timestamp > NOW() - 24 hours
    | STATS count = COUNT(*) BY host.name
    | SORT count DESC
    | LIMIT 10
  """
}

// Aggregation with multiple metrics
FROM metrics-*
| WHERE @timestamp > NOW() - 1 hour
| STATS avg_cpu = AVG(system.cpu.percent), max_cpu = MAX(system.cpu.percent) BY host.name
| WHERE avg_cpu > 80
| SORT avg_cpu DESC

// Enrichment and transformation
FROM logs-*
| WHERE log.level == "error"
| EVAL error_type = CASE(
    message LIKE "*timeout*", "timeout",
    message LIKE "*connection refused*", "connection",
    "other"
  )
| STATS count = COUNT(*) BY error_type
| SORT count DESC

// Pattern matching
// GROK extracts keyword columns by default; the ":int" suffix converts
// status to an integer so the numeric comparison below is type-correct.
FROM logs-*
| GROK message "%{IP:client_ip} %{WORD:method} %{URIPATHPARAM:path} %{NUMBER:status:int}"
| WHERE status >= 500
| STATS error_count = COUNT(*) BY path
| SORT error_count DESC

PUT _synonyms/my-synonyms-set
{
  "synonyms_set": [
    { "id": "rule1", "synonyms": "elasticsearch, ES, elastic search" },
    { "id": "rule2", "synonyms": "kubernetes, k8s, kube" },
    { "id": "rule3", "synonyms": "database => db" }
  ]
}

PUT /my-index
{
  "settings": {
    "analysis": {
      "filter": {
        "syn_filter": {
          "type": "synonym_graph",
          "synonyms_set": "my-synonyms-set",
          "updateable": true
        }
      },
      "analyzer": {
        "syn_analyzer": {
          "type": "custom",
          "tokenizer": "standard",
          "filter": ["lowercase", "syn_filter"]
        }
      }
    }
  }
}

PUT _synonyms/my-synonyms-set/rule4
{
  "synonyms": "AWS, Amazon Web Services"
}

Version	Feature
8.0	Security by default, kNN search, NLP inference, removal of mapping types
8.1	TSDB index mode (preview), Kibana Discover improvements
8.2	Improved kNN performance, geo_grid aggregation
8.3	Downsampling for TSDB, runtime fields improvements
8.4	Filtered kNN search, hybrid kNN+BM25, API key updates
8.5	Random sampler aggregation, improved keyword suggestion
8.6	kNN quantization support, improved join field performance
8.7	TSDB GA, health API, improved multi-field kNN
8.8	ELSER model, query-time vector generation, nested kNN
8.9	Improved ES|QL
8.10	Synonyms API, cross-cluster API keys, byte-quantized kNN
8.11	ES|QL (Elasticsearch Query Language)
8.12	Scalar quantization for vectors, improved logsdb
8.13	Semantic text field type, retrievers API
8.14	BBQ quantization, improved search performance
8.15	Bit vectors, improved HNSW, logsdb improvements
8.16	Improved synthetic source, passkey authentication
8.17	Final 8.x feature release before 9.0

# 7.x (deprecated)
PUT /my-index/_mapping/_doc { ... }

# 8.x (correct)
PUT /my-index/_mapping { ... }

# 7.x (deprecated)
GET /my-index/_doc/1/_source

# 8.x (correct)
GET /my-index/_source/1

curl -H "Content-Type: application/vnd.elasticsearch+json;compatible-with=7" \
     -H "Accept: application/vnd.elasticsearch+json;compatible-with=7" \
     localhost:9200/my-index/_search

# Pre-migration checks to run against the 7.x cluster before upgrading.
# Every URL is single-quoted: an unquoted '&' makes the shell background curl
# and drop the remaining query parameters, and an unquoted '?' is a glob
# character (zsh aborts with "no matches found").

# 1. Check deprecation log
curl -s 'localhost:9200/_migration/deprecations?pretty'

# 2. Resolve all deprecation warnings before upgrading

# 3. Ensure all nodes are on the latest 7.17.x
curl -s 'localhost:9200/_cat/nodes?v&h=name,version'

# 4. Take a snapshot
curl -X PUT 'localhost:9200/_snapshot/pre-upgrade-repo/pre-8x-snapshot?wait_for_completion=true'

# 5. Check index compatibility (indices created in 6.x need reindexing)
curl -s 'localhost:9200/_cat/indices?v&h=index,creation.date.string'

# Rolling upgrade: repeat steps 1-6 for one node at a time.
# URLs with query strings are single-quoted so the shell passes '?' and '&'
# through to curl instead of globbing or backgrounding the command.

# 1. Disable shard allocation (only primaries may be allocated while the node is down)
curl -X PUT localhost:9200/_cluster/settings -H 'Content-Type: application/json' -d '{
  "persistent": { "cluster.routing.allocation.enable": "primaries" }
}'

# 2. Flush
curl -X POST localhost:9200/_flush

# 3. Stop ES on target node, upgrade, start ES
systemctl stop elasticsearch
# ... upgrade package/binary ...
systemctl start elasticsearch

# 4. Wait for node to rejoin
curl -s 'localhost:9200/_cat/nodes?v'

# 5. Re-enable allocation
curl -X PUT localhost:9200/_cluster/settings -H 'Content-Type: application/json' -d '{
  "persistent": { "cluster.routing.allocation.enable": "all" }
}'

# 6. Wait for green, repeat for next node
#    (quoted so that timeout=5m actually reaches Elasticsearch and curl blocks until green)
curl -s 'localhost:9200/_cluster/health?wait_for_status=green&timeout=5m'

Elasticsearch 8.x Expert | Skills Pool

Elasticsearch 8.x Expert

Elasticsearch 8.x Expert

Key Features Introduced in Elasticsearch 8.x

Security by Default (8.0)

kNN Vector Search (8.0+, Improved in 8.4+, 8.8+, 8.12+)

NLP Inference (8.0+, PyTorch Models)

TSDB Index Mode (8.1+, GA in 8.7)

Searchable Snapshots (GA in 8.0)

Elastic Agent and Fleet (8.0+)

API Key Authentication Improvements (8.0+)

ES|QL (Elasticsearch Query Language, 8.11+)

Synonyms API (8.10+)

Other Notable 8.x Features

Breaking Changes from 7.x to 8.x

Removed Features

Behavioral Changes

API Changes

REST API Compatibility (7.x to 8.x)

Migration Guide: 7.x to 8.x

Pre-Migration Checklist

Upgrade Path

Rolling Upgrade Procedure

Common Pitfalls (8.x-Specific)

Version Boundaries

Reference Files

Vector Index Tuning

Azure Resource Manager Redis Dotnet

Redis Expert

Elasticsearch

Cache Expert

Abp Mongodb