• cloudwatch_exporter-aws-es.png
    cloudwatch_exporter-aws-es.png
  1. Requires Grafana version >= 7.
  2. Exporter: https://github.com/prometheus/cloudwatch_exporter
  3. Exporter configuration:
---
# AWS region used for the CloudWatch queries.
region: us-east-1
# Delay setting handed to the exporter, in seconds.
# NOTE(review): presumably skips the newest, not-yet-settled datapoints;
# confirm against the cloudwatch_exporter documentation.
delay_seconds: 60
# List of CloudWatch metrics to export, one mapping per metric.
metrics:
# ES cluster health
  # Cluster status (green / yellow / red)
  - aws_namespace: AWS/ES
    aws_metric_name: ClusterStatus.green
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  - aws_namespace: AWS/ES
    aws_metric_name: ClusterStatus.yellow
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  - aws_namespace: AWS/ES
    aws_metric_name: ClusterStatus.red
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Cluster index-write blocked status
  - aws_namespace: AWS/ES
    aws_metric_name: ClusterIndexWritesBlocked
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Master node reachability
  - aws_namespace: AWS/ES
    aws_metric_name: MasterReachableFromNode
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Automated snapshot failure status
  - aws_namespace: AWS/ES
    aws_metric_name: AutomatedSnapshotFailure
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Total number of nodes
  - aws_namespace: AWS/ES
    aws_metric_name: Nodes
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Storage space (both the Minimum and the Sum statistic are requested)
  - aws_namespace: AWS/ES
    aws_metric_name: FreeStorageSpace
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Minimum,Sum]
  # Kibana health
  - aws_namespace: AWS/ES
    aws_metric_name: KibanaHealthyNodes
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Number of deleted documents
  - aws_namespace: AWS/ES
    aws_metric_name: DeletedDocuments
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Number of searchable documents
  - aws_namespace: AWS/ES
    aws_metric_name: SearchableDocuments
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
# Key performance indicators
  # Indexing rate (per minute)
  - aws_namespace: AWS/ES
    aws_metric_name: IndexingRate
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Search query rate (per minute)
  - aws_namespace: AWS/ES
    aws_metric_name: SearchRate
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Indexing latency
  # NOTE(review): the original comment gives the unit as seconds; confirm
  # against the CloudWatch metric documentation.
  - aws_namespace: AWS/ES
    aws_metric_name: IndexingLatency
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Search query latency
  # NOTE(review): the original comment gives the unit as seconds; confirm
  # against the CloudWatch metric documentation.
  - aws_namespace: AWS/ES
    aws_metric_name: SearchLatency
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Request responses, one metric per HTTP status class
  - aws_namespace: AWS/ES
    aws_metric_name: 2xx
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  - aws_namespace: AWS/ES
    aws_metric_name: 3xx
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  - aws_namespace: AWS/ES
    aws_metric_name: 4xx
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  - aws_namespace: AWS/ES
    aws_metric_name: 5xx
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Number of requests with an invalid Host header
  - aws_namespace: AWS/ES
    aws_metric_name: InvalidHostHeaderRequests
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Number of requests
  - aws_namespace: AWS/ES
    aws_metric_name: ElasticsearchRequests
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
# Dedicated master nodes (optional)
  # CPU utilization
  - aws_namespace: AWS/ES
    aws_metric_name: MasterCPUUtilization
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # JVM memory pressure
  - aws_namespace: AWS/ES
    aws_metric_name: MasterJVMMemoryPressure
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
# Data nodes
  # Maximum CPU utilization
  - aws_namespace: AWS/ES
    aws_metric_name: CPUUtilization
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Maximum]
  # Maximum JVM memory pressure
  - aws_namespace: AWS/ES
    aws_metric_name: JVMMemoryPressure
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Maximum]
  # Minimum free storage space: intentionally no entry here.
  # FreeStorageSpace with the same namespace and dimensions is already
  # listed in the cluster-health section with the Minimum and Sum
  # statistics, so a second [Minimum] entry would only repeat the same
  # CloudWatch request and export the same series twice.
  # Maximum memory utilization
  - aws_namespace: AWS/ES
    aws_metric_name: SysMemoryUtilization
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Maximum]
# Elasticsearch JVM garbage collection
  # Young-generation collection count
  - aws_namespace: AWS/ES
    aws_metric_name: JVMGCYoungCollectionCount
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Young-generation collection time
  - aws_namespace: AWS/ES
    aws_metric_name: JVMGCYoungCollectionTime
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Old-generation collection count
  - aws_namespace: AWS/ES
    aws_metric_name: JVMGCOldCollectionCount
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Old-generation collection time
  - aws_namespace: AWS/ES
    aws_metric_name: JVMGCOldCollectionTime
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
# Elasticsearch JVM thread pools
  # Write thread pool
  - aws_namespace: AWS/ES
    aws_metric_name: ThreadpoolWriteThreads
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Index thread pool
  - aws_namespace: AWS/ES
    aws_metric_name: ThreadpoolIndexThreads
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Search thread pool
  - aws_namespace: AWS/ES
    aws_metric_name: ThreadpoolSearchThreads
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Merge (force_merge) thread pool
  - aws_namespace: AWS/ES
    aws_metric_name: ThreadpoolForce_mergeThreads
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
# Cross-cluster search connections
  # Cross-cluster inbound requests
  - aws_namespace: AWS/ES
    aws_metric_name: CrossClusterInboundRequests
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Cross-cluster outbound requests
  - aws_namespace: AWS/ES
    aws_metric_name: CrossClusterOutboundRequests
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
  # Cross-cluster outbound connections
  - aws_namespace: AWS/ES
    aws_metric_name: CrossClusterOutboundConnections
    aws_dimensions: [DomainName, ClientId]
    aws_statistics: [Average]
Get this dashboard:
13972