diff options
Diffstat (limited to 'templates/db/tidb_http/tidb_pd_http/template_db_tidb_pd_http.yaml')
-rw-r--r-- | templates/db/tidb_http/tidb_pd_http/template_db_tidb_pd_http.yaml | 46 |
1 files changed, 45 insertions, 1 deletions
diff --git a/templates/db/tidb_http/tidb_pd_http/template_db_tidb_pd_http.yaml b/templates/db/tidb_http/tidb_pd_http/template_db_tidb_pd_http.yaml index eb7f7b7d391..7016873346f 100644 --- a/templates/db/tidb_http/tidb_pd_http/template_db_tidb_pd_http.yaml +++ b/templates/db/tidb_http/tidb_pd_http/template_db_tidb_pd_http.yaml @@ -1,11 +1,13 @@ zabbix_export: version: '5.4' - date: '2021-05-09T00:00:00Z' + date: '2021-05-10T19:41:58Z' groups: - + uuid: 748ad4d098d447d492bb935c907f652f name: Templates/Databases templates: - + uuid: 43596328d4d74a5592906a9e08e3fd96 template: 'TiDB PD by HTTP' name: 'TiDB PD by HTTP' description: | @@ -23,6 +25,7 @@ zabbix_export: name: Templates/Databases items: - + uuid: 3a1fd879a08a445cbf438f3d68078111 name: 'PD: Get instance metrics' type: HTTP_AGENT key: pd.get_metrics @@ -45,6 +48,7 @@ zabbix_export: tag: Application value: 'Zabbix raw items' - + uuid: 7eb740eed4eb43a0a449e1c1436e582b name: 'PD: Get instance status' type: HTTP_AGENT key: pd.get_status @@ -65,6 +69,7 @@ zabbix_export: tag: Application value: 'Zabbix raw items' - + uuid: 101266930d0747748bf3cbd9259e2818 name: 'PD: GRPC Commands total, rate' type: DEPENDENT key: pd.grpc_command.rate @@ -89,6 +94,7 @@ zabbix_export: tag: Application value: 'PD instance' - + uuid: c18f702f68bf4fed94a598daffdada8a name: 'PD: Status' type: DEPENDENT key: pd.status @@ -118,10 +124,12 @@ zabbix_export: value: 'PD instance' triggers: - + uuid: ab1d0d23dad844099e42debb71512887 expression: 'last(/TiDB PD by HTTP/pd.status)=0' name: 'PD: Instance is not responding' priority: AVERAGE - + uuid: 0b71c8a5104b46ebbeabe0d708b6676e name: 'PD: Uptime' type: DEPENDENT key: pd.uptime @@ -149,12 +157,14 @@ zabbix_export: value: 'PD instance' triggers: - + uuid: 9f47a19f6f424df598e74c5a653ebf27 expression: 'last(/TiDB PD by HTTP/pd.uptime)<10m' name: 'PD: has been restarted (uptime < 10m)' priority: INFO description: 'Uptime is less than 10 minutes' manual_close: 'YES' - + uuid: c7e8e9bf01d04e5db25bd8eaafff3b80 name: 'PD: Version' type: DEPENDENT key: pd.version @@ -180,6 +190,7 @@ zabbix_export: value: 'PD instance' triggers: - + uuid: e0e2d4f5a4a14feebb61409014e94a2e expression: '(last(/TiDB PD by HTTP/pd.version,#1)<>last(/TiDB PD by HTTP/pd.version,#2))=1 and length(last(/TiDB PD by HTTP/pd.version))>0' name: 'PD: Version has changed (new version: {ITEM.VALUE})' priority: INFO @@ -187,6 +198,7 @@ zabbix_export: manual_close: 'YES' discovery_rules: - + uuid: cd1f27cf5f1d4f6f84032386ec7f8abb name: 'Cluster metrics discovery' type: DEPENDENT key: pd.cluster.discovery @@ -194,6 +206,7 @@ zabbix_export: description: 'Discovery cluster specific metrics.' item_prototypes: - + uuid: fe49e1de54214fb0ac882feb42fdee3b name: 'TiDB cluster: Number of regions' type: DEPENDENT key: 'pd.cluster_status.leader_count[{#SINGLETON}]' @@ -212,6 +225,7 @@ zabbix_export: tag: Application value: 'TiDB cluster' - + uuid: 0950ba514e05447c8cfe726ec2d76944 name: 'TiDB cluster: Current peer count' type: DEPENDENT key: 'pd.cluster_status.region_count[{#SINGLETON}]' @@ -230,6 +244,7 @@ zabbix_export: tag: Application value: 'TiDB cluster' - + uuid: d39f58372e3f464c87b2ec42acdf2061 name: 'TiDB cluster: Storage capacity' type: DEPENDENT key: 'pd.cluster_status.storage_capacity[{#SINGLETON}]' @@ -254,6 +269,7 @@ zabbix_export: tag: Application value: 'TiDB cluster' - + uuid: c72e6a2f89d041c4bf764021b9bc182c name: 'TiDB cluster: Storage size' type: DEPENDENT key: 'pd.cluster_status.storage_size[{#SINGLETON}]' @@ -274,6 +290,7 @@ zabbix_export: tag: Application value: 'TiDB cluster' - + uuid: 517cea991add45319d30047ac96fd9e4 name: 'TiDB cluster: Disconnect stores' type: DEPENDENT key: 'pd.cluster_status.store_disconnected[{#SINGLETON}]' @@ -297,11 +314,13 @@ zabbix_export: value: 'TiDB cluster' trigger_prototypes: - + uuid: 077d39f8ea194081a9d0c5dfdec4d1b5 expression: 'last(/TiDB PD by HTTP/pd.cluster_status.store_disconnected[{#SINGLETON}])>0' name: 'TiDB cluster: There are disconnected TiKV nodes' priority: WARNING description: 'PD does not receive a TiKV heartbeat within 20 seconds. Normally a TiKV heartbeat comes in every 10 seconds.' - + uuid: 7125a7c858264f339e879c1389c6c027 name: 'TiDB cluster: Down stores' type: DEPENDENT key: 'pd.cluster_status.store_down[{#SINGLETON}]' @@ -325,11 +344,13 @@ zabbix_export: value: 'TiDB cluster' trigger_prototypes: - + uuid: 526b935d3fa04825b7544eb6efd50ab5 expression: 'last(/TiDB PD by HTTP/pd.cluster_status.store_down[{#SINGLETON}])>0' name: 'TiDB cluster: There are offline TiKV nodes' priority: AVERAGE description: 'PD has not received a TiKV heartbeat for a long time.' - + uuid: c3bd9d1e0f6c427ab5232e57769030d1 name: 'TiDB cluster: Lowspace stores' type: DEPENDENT key: 'pd.cluster_status.store_low_space[{#SINGLETON}]' @@ -353,11 +374,13 @@ zabbix_export: value: 'TiDB cluster' trigger_prototypes: - + uuid: 87ef0f211afd4d58adec05007ef1d263 expression: 'last(/TiDB PD by HTTP/pd.cluster_status.store_low_space[{#SINGLETON}])>0' name: 'TiDB cluster: There are low space TiKV nodes' priority: AVERAGE description: 'Indicates that there is no sufficient space on the TiKV node.' - + uuid: 3c24fb49463b45f199dbc3955e87d01b name: 'TiDB cluster: Offline stores' type: DEPENDENT key: 'pd.cluster_status.store_offline[{#SINGLETON}]' @@ -379,6 +402,7 @@ zabbix_export: tag: Application value: 'TiDB cluster' - + uuid: 476a1b6e3c9b4b41ae1637f0e12801c9 name: 'TiDB cluster: Tombstone stores' type: DEPENDENT key: 'pd.cluster_status.store_tombstone[{#SINGLETON}]' @@ -401,6 +425,7 @@ zabbix_export: tag: Application value: 'TiDB cluster' - + uuid: 89db2b996fbe41bdb6b82ccf75139090 name: 'TiDB cluster: Unhealth stores' type: DEPENDENT key: 'pd.cluster_status.store_unhealth[{#SINGLETON}]' @@ -423,6 +448,7 @@ zabbix_export: tag: Application value: 'TiDB cluster' - + uuid: ff80108e2a5e45779a428a6fd31ea089 name: 'TiDB cluster: Normal stores' type: DEPENDENT key: 'pd.cluster_status.store_up[{#SINGLETON}]' @@ -446,12 +472,14 @@ zabbix_export: value: 'TiDB cluster' trigger_prototypes: - + uuid: fecf63d033b146d986f03e8d34e2d884 expression: 'min(/TiDB PD by HTTP/pd.cluster_status.storage_size[{#SINGLETON}],5m)/last(/TiDB PD by HTTP/pd.cluster_status.storage_capacity[{#SINGLETON}])*100>{$PD.STORAGE_USAGE.MAX.WARN}' name: 'TiDB cluster: Current storage usage is too high (over {$PD.STORAGE_USAGE.MAX.WARN}% for 5m)' priority: WARNING description: 'Over {$PD.STORAGE_USAGE.MAX.WARN}% of the cluster space is occupied.' graph_prototypes: - + uuid: 270de7aa73cf454cb147a3f5b39ebb35 name: 'TiDB cluster: Storage Usage[{#SINGLETON}]' graph_items: - @@ -483,6 +511,7 @@ zabbix_export: parameters: - 1h - + uuid: 113c6ba7d7f74051b042241441c43db0 name: 'gRPC commands discovery' type: DEPENDENT key: pd.grpc_command.discovery @@ -490,6 +519,7 @@ zabbix_export: description: 'Discovery grpc commands specific metrics.' item_prototypes: - + uuid: 7b96abc0e68a405ea5693f4f445936fe name: 'PD: GRPC Commands: {#GRPC_METHOD}, rate' type: DEPENDENT key: 'pd.grpc_command.rate[{#GRPC_METHOD}]' @@ -541,6 +571,7 @@ zabbix_export: parameters: - 1h - + uuid: 2cb28d7c862d442a84b5942eb4b54e2f name: 'Region discovery' type: DEPENDENT key: pd.region.discovery @@ -548,6 +579,7 @@ zabbix_export: description: 'Discovery region specific metrics.' item_prototypes: - + uuid: 024bf1d31bbd40a49d683d962887c6e0 name: 'PD: Region heartbeat: error, rate' type: DEPENDENT key: 'pd.region_heartbeat.error.rate[{#STORE_ADDRESS}]' @@ -573,6 +605,7 @@ zabbix_export: tag: Application value: 'TiDB Store [{#STORE_ADDRESS}]' - + uuid: 1d1d686f5c544a89a691a9b75e5c3b11 name: 'PD: Region heartbeat: active, rate' type: DEPENDENT key: 'pd.region_heartbeat.ok.rate[{#STORE_ADDRESS}]' @@ -598,6 +631,7 @@ zabbix_export: tag: Application value: 'TiDB Store [{#STORE_ADDRESS}]' - + uuid: c44f934ce8a144afa95252041535ef44 name: 'PD: Region schedule push: total, rate' type: DEPENDENT key: 'pd.region_heartbeat.push.err.rate[{#STORE_ADDRESS}]' @@ -622,6 +656,7 @@ zabbix_export: tag: Application value: 'TiDB Store [{#STORE_ADDRESS}]' - + uuid: ea76344669de4251a0e7bef35d70494a name: 'PD: Region heartbeat: total, rate' type: DEPENDENT key: 'pd.region_heartbeat.rate[{#STORE_ADDRESS}]' @@ -675,6 +710,7 @@ zabbix_export: parameters: - 1h - + uuid: 771ba9e078a14ca489eb2acf906080e9 name: 'Region labels discovery' type: DEPENDENT key: pd.region_labels.discovery @@ -682,6 +718,7 @@ zabbix_export: description: 'Discovery region labels specific metrics.' item_prototypes: - + uuid: 117efc3f2fe64c51a18cd3be162185ea name: 'TiDB cluster: Regions label: {#TYPE}' type: DEPENDENT key: 'pd.region_labels[{#TYPE}]' @@ -722,6 +759,7 @@ zabbix_export: parameters: - 1h - + uuid: ffbf9adaa72842fdbb49c008625c1575 name: 'Region status discovery' type: DEPENDENT key: pd.region_status.discovery @@ -729,6 +767,7 @@ zabbix_export: description: 'Discovery region status specific metrics.' item_prototypes: - + uuid: 45ef4940b0454492b70116d8958c9b11 name: 'TiDB cluster: Regions status: {#TYPE}' type: DEPENDENT key: 'pd.region_status[{#TYPE}]' @@ -749,12 +788,14 @@ zabbix_export: value: 'TiDB cluster' trigger_prototypes: - + uuid: 101bb66de2a948169aad0b0790dcf35e expression: 'min(/TiDB PD by HTTP/pd.region_status[{#TYPE}],5m)>0' name: 'TiDB cluster: There are unresponsive peers' discover: NO_DISCOVER priority: WARNING description: 'The number of Regions with an unresponsive peer reported by the Raft leader.' - + uuid: e1db516832aa44a99642c1f597656d3b expression: 'min(/TiDB PD by HTTP/pd.region_status[{#TYPE}],5m)>{$PD.MISS_REGION.MAX.WARN}' name: 'TiDB cluster: Too many missed regions (over {$PD.MISS_REGION.MAX.WARN} in 5m)' discover: NO_DISCOVER @@ -815,6 +856,7 @@ zabbix_export: status: ENABLED discover: DISCOVER - + uuid: b4b8007810ad4f7ba8da212cdde5b71b name: 'Running scheduler discovery' type: DEPENDENT key: pd.scheduler.discovery @@ -822,6 +864,7 @@ zabbix_export: description: 'Discovery scheduler specific metrics.' item_prototypes: - + uuid: c6748a20540f49b293795bc72480dda7 name: 'TiDB cluster: Scheduler status: {#KIND}' type: DEPENDENT key: 'pd.scheduler[{#KIND}]' @@ -882,6 +925,7 @@ zabbix_export: description: 'PD server URL' valuemaps: - + uuid: bce54cbdf2b8487985f9c7847a4c4918 name: 'Service state' mappings: - |