diff options
author | Sten Turpin <stenwt@users.noreply.github.com> | 2016-02-10 10:28:03 -0600 |
---|---|---|
committer | Sten Turpin <stenwt@users.noreply.github.com> | 2016-02-10 10:28:03 -0600 |
commit | 9c339b580e81eee7b9a4e7707b72176336732b98 (patch) | |
tree | 3f7f722100540beca53a71c1c6c578e13b9c949e /roles/os_zabbix | |
parent | 6f4aeb1039df339e8a4e1500920e078f09c944a3 (diff) | |
parent | 5e8f8fdca37bcfb9222fa644d9f0a49451636c8f (diff) | |
download | openshift-9c339b580e81eee7b9a4e7707b72176336732b98.tar.gz openshift-9c339b580e81eee7b9a4e7707b72176336732b98.tar.bz2 openshift-9c339b580e81eee7b9a4e7707b72176336732b98.tar.xz openshift-9c339b580e81eee7b9a4e7707b72176336732b98.zip |
Merge pull request #1372 from stenwt/sturpin-2016-02-09-registry-health
added nodes not ready and nodes not schedulable triggers
Diffstat (limited to 'roles/os_zabbix')
-rw-r--r-- | roles/os_zabbix/vars/template_openshift_master.yml | 26 |
1 files changed, 26 insertions, 0 deletions
```diff
diff --git a/roles/os_zabbix/vars/template_openshift_master.yml b/roles/os_zabbix/vars/template_openshift_master.yml
index 5aae2496a..bcf75e457 100644
--- a/roles/os_zabbix/vars/template_openshift_master.yml
+++ b/roles/os_zabbix/vars/template_openshift_master.yml
@@ -201,6 +201,18 @@ g_template_openshift_master:
     applications:
     - Openshift Master Metrics
 
+  - key: openshift.master.nodesnotready.count
+    description: "This check shows how many nodes in a cluster are in NotReady state."
+    type: int
+    applications:
+    - Openshift Master
+
+  - key: openshift.master.nodesnotschedulable.count
+    description: "This check shows how many nodes in a cluster are not schedulable."
+    type: int
+    applications:
+    - Openshift Master
+
   - key: openshift.master.apiserver.latency.summary.pods.quantile.list.5
     description: "Value from https://master/metrics. This is the time, in miliseconds, that 50% of the pod operations have taken to completed."
     type: int
@@ -361,6 +373,20 @@ g_template_openshift_master:
     - 'Openshift Master API health check is failing on {HOST.NAME}'
     priority: high
 
+  - name: 'Hosts not ready according to {HOST.NAME}'
+    expression: '{Template Openshift Master:openshift.master.nodesnotready.count.last(#2)>0'
+    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/openshift_node.asciidoc'
+    dependencies:
+    - 'Openshift Master procecss not running on {HOST.NAME}'
+    priority: high
+
+  - name: 'Hosts not schedulable according to {HOST.NAME}'
+    expression: '{Template Openshift Master:openshift.master.nodesnotschedulable.count.last(#2)>0'
+    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/openshift_node.asciidoc'
+    dependencies:
+    - 'Openshift Master procecss not running on {HOST.NAME}'
+    priority: info
+
   zgraphs:
   - name: Openshift Master API Server Latency Pods LIST Quantiles
     width: 900
```