# template_os_linux.yml 6.2 KB
  1. ---
  2. g_template_os_linux:
  3. name: Template OS Linux
  # Items attached to the template. Each entry gives the item key, the
  # application(s) it is grouped under, and the stored value type.
  # NOTE(review): keys look like PCP metric names -- confirm with the collector.
  zitems:
  # Kernel items
  - key: kernel.uname.sysname
    applications:
    - Kernel
    value_type: string
  - key: kernel.all.cpu.wait.total
    applications:
    - Kernel
    value_type: int
  - key: kernel.all.cpu.irq.hard
    applications:
    - Kernel
    value_type: int
  - key: kernel.all.cpu.idle
    applications:
    - Kernel
    value_type: int
  - key: kernel.uname.distro
    applications:
    - Kernel
    value_type: string
  - key: kernel.uname.nodename
    applications:
    - Kernel
    value_type: string
  - key: kernel.all.cpu.irq.soft
    applications:
    - Kernel
    value_type: int
  - key: kernel.all.load.15_minute
    applications:
    - Kernel
    value_type: float
  - key: kernel.all.cpu.sys
    applications:
    - Kernel
    value_type: int
  - key: kernel.all.load.5_minute
    applications:
    - Kernel
    value_type: float
  - key: kernel.all.cpu.nice
    applications:
    - Kernel
    value_type: int
  - key: kernel.all.load.1_minute
    applications:
    - Kernel
    value_type: float
  - key: kernel.uname.version
    applications:
    - Kernel
    value_type: string
  - key: kernel.all.uptime
    applications:
    - Kernel
    value_type: int
  - key: kernel.all.cpu.user
    applications:
    - Kernel
    value_type: int
  - key: kernel.uname.machine
    applications:
    - Kernel
    value_type: string
  - key: hinv.ncpu
    applications:
    - Kernel
    value_type: int
  - key: kernel.all.cpu.steal
    applications:
    - Kernel
    value_type: int
  - key: kernel.all.pswitch
    applications:
    - Kernel
    value_type: int
  - key: kernel.uname.release
    applications:
    - Kernel
    value_type: string
  # Total process count; the "Too many TOTAL processes" trigger reads this key.
  - key: proc.nprocs
    applications:
    - Kernel
    value_type: int
  # Memory Items
  # Every entry applies multiplier 1024 and reports units B.
  # NOTE(review): presumably the collected values are in KB and are scaled to
  # bytes (the memory trigger description says "30000 KB x 1024") -- confirm.
  - key: mem.freemem
    applications:
    - Memory
    value_type: int
    description: "PCP: free system memory metric from /proc/meminfo"
    multiplier: 1024
    units: B
  - key: mem.util.bufmem
    applications:
    - Memory
    value_type: int
    description: "PCP: Memory allocated for buffer_heads.; I/O buffers metric from /proc/meminfo"
    multiplier: 1024
    units: B
  - key: swap.used
    applications:
    - Memory
    value_type: int
    description: "PCP: swap used metric from /proc/meminfo"
    multiplier: 1024
    units: B
  - key: swap.length
    applications:
    - Memory
    value_type: int
    description: "PCP: total swap available metric from /proc/meminfo"
    multiplier: 1024
    units: B
  - key: mem.physmem
    applications:
    - Memory
    value_type: int
    description: "PCP: The value of this metric corresponds to the \"MemTotal\" field reported by /proc/meminfo. Note that this does not necessarily correspond to actual installed physical memory - there may be areas of the physical address space mapped as ROM in various peripheral devices and the bios may be mirroring certain ROMs in RAM."
    multiplier: 1024
    units: B
  - key: swap.free
    applications:
    - Memory
    value_type: int
    description: "PCP: swap free metric from /proc/meminfo"
    multiplier: 1024
    units: B
  - key: mem.util.available
    applications:
    - Memory
    value_type: int
    description: "PCP: The amount of memory that is available for a new workload, without pushing the system into swap. Estimated from MemFree, Active(file), Inactive(file), and SReclaimable, as well as the \"low\" watermarks from /proc/zoneinfo.; available memory from /proc/meminfo"
    multiplier: 1024
    units: B
  - key: mem.util.used
    applications:
    - Memory
    value_type: int
    description: "PCP: Used memory is the difference between mem.physmem and mem.freemem; used memory metric from /proc/meminfo"
    multiplier: 1024
    units: B
  - key: mem.util.cached
    applications:
    - Memory
    value_type: int
    description: "PCP: Memory used by the page cache, including buffered file data. This is in-memory cache for files read from the disk (the pagecache) but doesn't include SwapCached.; page cache metric from /proc/meminfo"
    multiplier: 1024
    units: B
  # Disk items
  # Static per-device fill-level items. The triggers in this file label
  # xvda2 as "/" and xvda3 as "/var" and compare these values against 90/95.
  - key: filesys.full.xvda2
    applications:
    - Disk
    value_type: float
  - key: filesys.full.xvda3
    applications:
    - Disk
    value_type: float
  # Low-level discovery rules. The single rule here registers filesystems
  # dynamically; item prototypes bind to it through its key.
  zdiscoveryrules:
  - name: disc.filesys
    key: disc.filesys
    # NOTE(review): the unit of lifetime is not stated in this file -- confirm.
    lifetime: 1
    template_name: Template OS Linux
    description: "Dynamically register the filesystems"
  # Item prototypes instantiated per discovered entity. discoveryrule_key
  # ties the prototype to the disc.filesys rule; {#OSO_FILESYS} is the
  # discovery macro substituted into both the name and the key.
  zitemprototypes:
  - discoveryrule_key: disc.filesys
    template_name: Template OS Linux
    name: "disc.filesys.full.{#OSO_FILESYS}"
    key: "disc.filesys.full[{#OSO_FILESYS}]"
    value_type: float
    description: "PCP filesys.full option. This is the percent full returned from pcp filesys.full"
    applications:
    - Disk
  # Triggers. Each expression compares the last() value of a template item
  # against a fixed threshold; url points at the matching SOP document.
  ztriggers:
  # Filesystem fill level: >90 raises warn, >95 raises high, per device.
  - name: 'Filesystem: / has less than 10% free on {HOST.NAME}'
    expression: '{Template OS Linux:filesys.full.xvda2.last()}>90'
    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_filesys_full.asciidoc'
    priority: warn
  - name: 'Filesystem: / has less than 5% free on {HOST.NAME}'
    expression: '{Template OS Linux:filesys.full.xvda2.last()}>95'
    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_filesys_full.asciidoc'
    priority: high
  - name: 'Filesystem: /var has less than 10% free on {HOST.NAME}'
    expression: '{Template OS Linux:filesys.full.xvda3.last()}>90'
    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_filesys_full.asciidoc'
    priority: warn
  - name: 'Filesystem: /var has less than 5% free on {HOST.NAME}'
    expression: '{Template OS Linux:filesys.full.xvda3.last()}>95'
    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_filesys_full.asciidoc'
    priority: high
  # Process count ceiling.
  - name: 'Too many TOTAL processes on {HOST.NAME}'
    expression: '{Template OS Linux:proc.nprocs.last()}>5000'
    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_proc.asciidoc'
    priority: warn
  # Threshold 30720000 = 30000 x 1024 (see the description below).
  # NOTE(review): the name says "available memory" but the expression reads
  # mem.freemem, not mem.util.available -- confirm this is intended.
  - name: 'Lack of available memory on {HOST.NAME}'
    expression: '{Template OS Linux:mem.freemem.last()}<30720000'
    url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_memory.asciidoc'
    priority: warn
    description: 'Alert on less than 30MegaBytes. This is 30 Million Bytes. 30000 KB x 1024'