From d1933cbe454730291ca412f0b48a349b4079dab4 Mon Sep 17 00:00:00 2001 From: zhizhang Date: Wed, 24 Feb 2016 10:48:18 +0800 Subject: add key of openshift.master.app.build.create --- roles/os_zabbix/vars/template_openshift_master.yml | 6 ++++++ 1 file changed, 6 insertions(+) (limited to 'roles/os_zabbix/vars') diff --git a/roles/os_zabbix/vars/template_openshift_master.yml b/roles/os_zabbix/vars/template_openshift_master.yml index e36f23a2b..4ddff6545 100644 --- a/roles/os_zabbix/vars/template_openshift_master.yml +++ b/roles/os_zabbix/vars/template_openshift_master.yml @@ -6,6 +6,12 @@ g_template_openshift_master: applications: - Openshift Master key: openshift.master.app.create + + - key: openshift.master.app.build.create + description: "check the app create with a build process" + type: int + applications: + - Openshift Master - key: openshift.master.process.count description: Shows number of master processes running -- cgit v1.2.3 From 0a2afe60757991ce7d32d0cf4d9344394225d0c2 Mon Sep 17 00:00:00 2001 From: zhizhang Date: Thu, 25 Feb 2016 11:10:39 +0800 Subject: add trigger for app creation with build process --- roles/os_zabbix/vars/template_openshift_master.yml | 15 +++++++++++++++ 1 file changed, 15 insertions(+) (limited to 'roles/os_zabbix/vars') diff --git a/roles/os_zabbix/vars/template_openshift_master.yml b/roles/os_zabbix/vars/template_openshift_master.yml index 4ddff6545..836456b89 100644 --- a/roles/os_zabbix/vars/template_openshift_master.yml +++ b/roles/os_zabbix/vars/template_openshift_master.yml @@ -301,6 +301,13 @@ g_template_openshift_master: - 'Openshift Master process not running on {HOST.NAME}' priority: avg + - name: 'Application creation with build has failed on {HOST.NAME}' + expression: '{Template Openshift Master:openshift.master.app.build.create.last(#1)}=1 and {Template Openshift Master:openshift.master.app.build.create.last(#2)}=1' + url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_create_app.asciidoc' + dependencies: + - 'Openshift Master process not running on {HOST.NAME}' + priority: avg + - name: 'Application creation has failed multiple times in the last hour on {HOST.NAME}' expression: '{Template Openshift Master:openshift.master.app.create.sum(1h)}>3' url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_create_app.asciidoc' @@ -309,6 +316,14 @@ g_template_openshift_master: description: The application create loop has failed 4 or more times in the last hour priority: avg + - name: 'Application with build creation has failed multiple times in the last hour on {HOST.NAME}' + expression: '{Template Openshift Master:openshift.master.app.build.create.sum(1h)}>3' + url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_create_app.asciidoc' + dependencies: + - 'Openshift Master process not running on {HOST.NAME}' + description: The application create loop has failed 4 or more times in the last hour + priority: avg + - name: 'Openshift Master API health check is failing on {HOST.NAME}' expression: '{Template Openshift Master:openshift.master.api.healthz.max(#3)}<1' url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/openshift_master.asciidoc' -- cgit v1.2.3 From a6aea811c2ca7cb8d8c2f5291c5d49cb5425b7c9 Mon Sep 17 00:00:00 2001 From: zhizhang Date: Mon, 29 Feb 2016 13:30:21 +0800 Subject: add item of time cost a app build and app create --- roles/os_zabbix/vars/template_openshift_master.yml | 12 ++++++++++++ 1 file changed, 12 insertions(+) (limited to 'roles/os_zabbix/vars') diff --git a/roles/os_zabbix/vars/template_openshift_master.yml b/roles/os_zabbix/vars/template_openshift_master.yml index 836456b89..75e4b9ce2 100644 --- a/roles/os_zabbix/vars/template_openshift_master.yml +++ b/roles/os_zabbix/vars/template_openshift_master.yml @@ -13,6 +13,18 @@ g_template_openshift_master: applications: - Openshift Master + - key: openshift.master.app.create.time + description: "check the time it takes app create with a build process" + type: int + applications: + - Openshift Master + + - key: openshift.master.app.build.time + description: "check the time it takes app build" + type: int + applications: + - Openshift Master + - key: openshift.master.process.count description: Shows number of master processes running type: int -- cgit v1.2.3 From fbfbe9d0992b3ede4d85acadb34ba60b8f9b5c69 Mon Sep 17 00:00:00 2001 From: zhizhang Date: Wed, 16 Mar 2016 09:23:39 +0800 Subject: change the check time from 1 hour to 2 hour --- roles/os_zabbix/vars/template_openshift_master.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) (limited to 'roles/os_zabbix/vars') diff --git a/roles/os_zabbix/vars/template_openshift_master.yml b/roles/os_zabbix/vars/template_openshift_master.yml index 75e4b9ce2..45f2ecf07 100644 --- a/roles/os_zabbix/vars/template_openshift_master.yml +++ b/roles/os_zabbix/vars/template_openshift_master.yml @@ -328,8 +328,8 @@ g_template_openshift_master: description: The application create loop has failed 4 or more times in the last hour priority: avg - - name: 'Application with build creation has failed multiple times in the last hour on {HOST.NAME}' - expression: '{Template Openshift Master:openshift.master.app.build.create.sum(1h)}>3' + - name: 'Application with build creation has failed multiple times in the last 2 hour on {HOST.NAME}' + expression: '{Template Openshift Master:openshift.master.app.build.create.sum(2h)}>3' url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_create_app.asciidoc' dependencies: - 'Openshift Master process not running on {HOST.NAME}' -- cgit v1.2.3