@llplmlyd
        
        2021-06-28T09:19:55.000000Z
        字数 3651
        阅读 838
    数据库-TiDB
# TiDB
count(probe_success{tidb_cluster="$tidb_cluster", group="tidb"} == 1)
# PD
count(probe_success{tidb_cluster="$tidb_cluster", group="pd"} == 1)
# TiKV
count(probe_success{tidb_cluster="$tidb_cluster", group="tikv"} == 1)
# TiFlash
count(probe_success{tidb_cluster="$tidb_cluster", group="tiflash"} == 1)
# Pump
count(probe_success{tidb_cluster="$tidb_cluster", group="pump"} == 1)
## 整个集群的磁盘使用率
sum(pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance",type="storage_size"}) / sum(pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance",type="storage_capacity"})
## 失联的store数量
sum(pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance", type="store_disconnected_count"})
## 不健康的store数量
sum(pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance", type="store_unhealth_count"})
## 存储空间较低的store数量
sum(pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance", type="store_low_space_count"})
## 进程停止的store数量
sum(pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance", type="store_down_count"})
## 正在下线的store数量
sum(pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance", type="store_offline_count"})
## 已经下线的store数量
sum(pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance", type="store_tombstone_count"})
# 当前集群的 Region 总量,请注意 Region 数量与副本数无关
pd_cluster_status{tidb_cluster="$tidb_cluster", instance="$instance", type="leader_count"}
## region health
pd_regions_status{tidb_cluster="$tidb_cluster", instance="$instance"}
sum(pd_regions_status{tidb_cluster="$tidb_cluster"}) by (instance, type)
## PD 启动时间
(time() - process_start_time_seconds{tidb_cluster="$tidb_cluster",job=~".*pd.*"})
## 创建的调度
sum(delta(pd_schedule_operators_count{tidb_cluster="$tidb_cluster", instance="$instance", event="create"}[1m])) by (type)
## 完成的调度
sum(delta(pd_schedule_operators_count{tidb_cluster="$tidb_cluster", instance="$instance", event="finish"}[1m])) by (type)
## TiKV leader info
sum(tikv_raftstore_region_count{tidb_cluster="$tidb_cluster", type="leader"}) by (instance)
## TiKV region info
sum(tikv_raftstore_region_count{tidb_cluster="$tidb_cluster", type="region"}) by (instance)
## TiKV 内存使用量(字节)
avg(process_resident_memory_bytes{tidb_cluster="$tidb_cluster", instance=~"$instance"}) by (instance)
## TiKV Server is Busy
sum(rate(tikv_scheduler_too_busy_total{instance=~"$instance"}[1m])) by (instance)
sum(rate(tikv_channel_full_total{instance=~"$instance"}[1m])) by (instance, type)
sum(rate(tikv_coprocessor_request_error{instance=~"$instance", type='full'}[1m])) by (instance)
avg(tikv_engine_write_stall{instance=~"$instance", type="write_stall_percentile99"}) by (instance)
## TiKV 未compact的堆积字节数量,反映写入压力情况
sum(tikv_engine_pending_compaction_bytes{tidb_cluster="$tidb_cluster", instance=~"$instance", db="$db"}) by (cf)
## TiDB info 内存信息
process_resident_memory_bytes{tidb_cluster="$tidb_cluster", job="tidb"}
## TiDB运行时间
(time() - process_start_time_seconds{tidb_cluster="$tidb_cluster", job="tidb"})
## TiDB 各个节点的连接数
tidb_server_connections{tidb_cluster="$tidb_cluster"}
## 集群总的连接数
sum(tidb_server_connections{tidb_cluster="$tidb_cluster"})
## TiDB查询延迟99%
histogram_quantile(0.99, sum(rate(tidb_server_handle_query_duration_seconds_bucket{tidb_cluster="$tidb_cluster", sql_type!="internal"}[1m])) by (le))
## TiDB查询延迟95%
histogram_quantile(0.95, sum(rate(tidb_server_handle_query_duration_seconds_bucket{tidb_cluster="$tidb_cluster", sql_type!="internal"}[1m])) by (le))
## 集群QPS
# 按照类型
sum(rate(tidb_executor_statement_total{tidb_cluster="$tidb_cluster"}[1m])) by (type)
# 总的
sum(rate(tidb_executor_statement_total{tidb_cluster="$tidb_cluster"}[1m]))
## 集群TPS
sum(rate(tidb_session_transaction_duration_seconds_count{tidb_cluster="$tidb_cluster"}[1m])) by (type, txn_mode)