Browse Source

Merge pull request #1606 from BlueShells/BuildappMonitor

Buildapp monitor
Kenny Woodson 9 years ago
parent
commit
025a2b962a
1 changed files with 33 additions and 0 deletions
  1. 33 0
      roles/os_zabbix/vars/template_openshift_master.yml

+ 33 - 0
roles/os_zabbix/vars/template_openshift_master.yml

@@ -6,6 +6,24 @@ g_template_openshift_master:
     applications:
     - Openshift Master
     key: openshift.master.app.create
+  
+  - key: openshift.master.app.build.create
+    description: "check app creation with a build process"
+    type: int
+    applications:
+    - Openshift Master
+
+  - key: openshift.master.app.create.time
+    description: "check the time it takes to create an app with a build process"
+    type: int
+    applications:
+    - Openshift Master
+
+  - key: openshift.master.app.build.time
+    description: "check the time it takes to build an app"
+    type: int
+    applications:
+    - Openshift Master
 
   - key: openshift.master.process.count
     description: Shows number of master processes running
@@ -295,6 +313,13 @@ g_template_openshift_master:
     - 'Openshift Master process not running on {HOST.NAME}'
     priority: avg
 
+  - name: 'Application creation with build has failed on {HOST.NAME}'
+    expression: '{Template Openshift Master:openshift.master.app.build.create.last(#1)}=1 and {Template Openshift Master:openshift.master.app.build.create.last(#2)}=1'
+    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_create_app.asciidoc'
+    dependencies:
+    - 'Openshift Master process not running on {HOST.NAME}'
+    priority: avg
+
   - name: 'Application creation has failed multiple times in the last hour on {HOST.NAME}'
     expression: '{Template Openshift Master:openshift.master.app.create.sum(1h)}>3'
     url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_create_app.asciidoc'
@@ -303,6 +328,14 @@ g_template_openshift_master:
     description: The application create loop has failed 4 or more times in the last hour
     priority: avg
 
+  - name: 'Application with build creation has failed multiple times in the last 2 hour on {HOST.NAME}'
+    expression: '{Template Openshift Master:openshift.master.app.build.create.sum(2h)}>3'
+    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_create_app.asciidoc'
+    dependencies:
+    - 'Openshift Master process not running on {HOST.NAME}'
+    description: The application create with build loop has failed 4 or more times in the last 2 hours
+    priority: avg
+
   - name: 'Openshift Master API health check is failing on {HOST.NAME}'
     expression: '{Template Openshift Master:openshift.master.api.healthz.max(#3)}<1'
     url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/openshift_master.asciidoc'