You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
1921 lines
88 KiB
1921 lines
88 KiB
zabbix_export:
|
|
version: '7.0'
|
|
template_groups:
|
|
- uuid: 748ad4d098d447d492bb935c907f652f
|
|
name: Templates/Databases
|
|
templates:
|
|
- uuid: 47d87c39c121429b98a18f641aa443ea
|
|
template: 'GridGain by JMX'
|
|
name: 'GridGain by JMX'
|
|
description: |
|
|
The template to monitor GridGain In-Memory Computing Platform by Zabbix that works without any external scripts.
|
|
It works with both standalone and cluster instances.
|
|
The metrics are discoverable and collected by JMX.
|
|
The current JMX tree hierarchy contains the classloader by default. Add the JVM option `-DIGNITE_MBEAN_APPEND_CLASS_LOADER_ID=false` to exclude the level with the classloader name.
|
|
You can set the {$GRIDGAIN.USER} and {$GRIDGAIN.PASSWORD} macros in the template for use at the host level.
|
|
|
|
You can discuss this template or leave feedback on our forum https://www.zabbix.com/forum/zabbix-suggestions-and-feedback/
|
|
|
|
Generated by official Zabbix template tool "Templator" 2.0.0
|
|
vendor:
|
|
name: Zabbix
|
|
version: 7.0-0
|
|
groups:
|
|
- name: Templates/Databases
|
|
discovery_rules:
|
|
- uuid: f8d8a6cd41da496ea6d61793e0ab0d00
|
|
name: 'Data region metrics'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=DataRegionMetrics,*"]'
|
|
delay: 10m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
filter:
|
|
evaltype: AND
|
|
conditions:
|
|
- macro: '{#JMXNAME}'
|
|
value: '{$GRIDGAIN.LLD.FILTER.DATA.REGION.MATCHES}'
|
|
formulaid: A
|
|
- macro: '{#JMXNAME}'
|
|
value: '{$GRIDGAIN.LLD.FILTER.DATA.REGION.NOT_MATCHES}'
|
|
operator: NOT_MATCHES_REGEX
|
|
formulaid: B
|
|
item_prototypes:
|
|
- uuid: c09b0ea002db4c3d9104a7f51b9921cc
|
|
name: 'Data region {#JMXNAME}: Allocation, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",AllocationRate]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '!pps'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Allocation rate (pages per second) averaged across rateTimeInterval.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
- uuid: 3425f6775e9e4a979d876becddec46d2
|
|
name: 'Data region {#JMXNAME}: Checkpoint buffer size'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CheckpointBufferSize]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: B
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Total size in bytes for checkpoint buffer.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
- uuid: 6e44ce63725a46b486175e34697776ee
|
|
name: 'Data region {#JMXNAME}: Dirty pages'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",DirtyPages]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Number of pages in memory not yet synchronized with persistent storage.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
- uuid: 5396db6809ca44c480f123e1e63430b4
|
|
name: 'Data region {#JMXNAME}: Eviction, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",EvictionRate]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '!pps'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Eviction rate (pages per second).'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
trigger_prototypes:
|
|
- uuid: 7e2fc41d632240b3869080d41ef5e639
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",EvictionRate],5m)>0'
|
|
name: 'Data region {#JMXNAME}: Node started to evict pages'
|
|
priority: INFO
|
|
description: 'You store more data than the region can accommodate. Data has started to move to disk, which can make requests slower. Acknowledge to close the problem manually.'
|
|
manual_close: 'YES'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: 9f7d683cf3ca47c681eef43e4dd9a471
|
|
name: 'Data region {#JMXNAME}: Size, max'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",MaxSize]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: B
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Maximum memory region size defined by its data region.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
- uuid: 16170e6c8007492984c367892a7393aa
|
|
name: 'Data region {#JMXNAME}: Offheap size'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",OffHeapSize]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: B
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Offheap size in bytes.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
- uuid: 982c738bdd4f4802917d3f5d63cc489f
|
|
name: 'Data region {#JMXNAME}: Offheap used size'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",OffheapUsedSize]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: B
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Total used offheap size in bytes.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
- uuid: 03c923d00e5a486faece1f37b3a2863d
|
|
name: 'Data region {#JMXNAME}: Pages fill factor'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",PagesFillFactor]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '%'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The percentage of the used space.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
- uuid: 9094f5992c514be6abaee490b211774e
|
|
name: 'Data region {#JMXNAME}: Pages replace, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",PagesReplaceRate]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '!pps'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Rate at which pages in memory are replaced with pages from persistent storage (pages per second).'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
trigger_prototypes:
|
|
- uuid: d2b012fdfe634526bb583d4ad18abe4d
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",PagesReplaceRate],5m)>0'
|
|
name: 'Data region {#JMXNAME}: Pages replace rate more than 0'
|
|
priority: WARNING
|
|
description: 'There is more data than DataRegionMaxSize. Cluster started to replace pages in memory. Page replacement can slow down operations.'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: 390107f411e24581a61043000b42152f
|
|
name: 'Data region {#JMXNAME}: Allocated, bytes'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TotalAllocatedSize]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: B
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Total size of memory allocated in bytes.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
- uuid: 8e0e7a96f0a6424b88829fab78cce2ba
|
|
name: 'Data region {#JMXNAME}: Used checkpoint buffer size'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",UsedCheckpointBufferSize]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: B
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Used checkpoint buffer size in bytes.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: data_region
|
|
trigger_prototypes:
|
|
- uuid: 9a7d7c745faa4f1fa4ffd1ca8c1ac602
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",UsedCheckpointBufferSize],5m)/last(/GridGain by JMX/jmx["{#JMXOBJ}",CheckpointBufferSize])*100>{$GRIDGAIN.CHECKPOINT.PUSED.MAX.HIGH}'
|
|
name: 'Data region {#JMXNAME}: Checkpoint buffer utilization is too high'
|
|
event_name: 'Data region {#JMXNAME}: Checkpoint buffer utilization is too high (over {$GRIDGAIN.CHECKPOINT.PUSED.MAX.HIGH} in 5m)'
|
|
priority: HIGH
|
|
description: 'Checkpoint buffer utilization is high. Threads will be throttled to avoid buffer overflow. It can be caused by high disk utilization.'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: 02ce52a2067147238969a4fd24f85bdc
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",UsedCheckpointBufferSize],5m)/last(/GridGain by JMX/jmx["{#JMXOBJ}",CheckpointBufferSize])*100>{$GRIDGAIN.CHECKPOINT.PUSED.MAX.WARN}'
|
|
name: 'Data region {#JMXNAME}: Checkpoint buffer utilization is too high'
|
|
event_name: 'Data region {#JMXNAME}: Checkpoint buffer utilization is too high (over {$GRIDGAIN.CHECKPOINT.PUSED.MAX.WARN} in 5m)'
|
|
priority: WARNING
|
|
description: 'Checkpoint buffer utilization is high. Threads will be throttled to avoid buffer overflow. It can be caused by high disk utilization.'
|
|
dependencies:
|
|
- name: 'Data region {#JMXNAME}: Checkpoint buffer utilization is too high'
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",UsedCheckpointBufferSize],5m)/last(/GridGain by JMX/jmx["{#JMXOBJ}",CheckpointBufferSize])*100>{$GRIDGAIN.CHECKPOINT.PUSED.MAX.HIGH}'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: 92c2772aa8d7425e8bee5d760ba5b607
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",OffheapUsedSize],5m)/last(/GridGain by JMX/jmx["{#JMXOBJ}",OffHeapSize])*100>{$GRIDGAIN.DATA.REGION.PUSED.MAX.HIGH}'
|
|
name: 'Data region {#JMXNAME}: Data region utilization is too high'
|
|
event_name: 'Data region {#JMXNAME}: Data region utilization is too high (over {$GRIDGAIN.DATA.REGION.PUSED.MAX.HIGH} in 5m)'
|
|
priority: HIGH
|
|
description: 'Data region utilization is high. Increase data region size or delete any data.'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: 3694e6d813b04b51a77c842de617503c
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",OffheapUsedSize],5m)/last(/GridGain by JMX/jmx["{#JMXOBJ}",OffHeapSize])*100>{$GRIDGAIN.DATA.REGION.PUSED.MAX.WARN}'
|
|
name: 'Data region {#JMXNAME}: Data region utilization is too high'
|
|
event_name: 'Data region {#JMXNAME}: Data region utilization is too high (over {$GRIDGAIN.DATA.REGION.PUSED.MAX.WARN} in 5m)'
|
|
priority: WARNING
|
|
description: 'Data region utilization is high. Increase data region size or delete any data.'
|
|
dependencies:
|
|
- name: 'Data region {#JMXNAME}: Data region utilization is too high'
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",OffheapUsedSize],5m)/last(/GridGain by JMX/jmx["{#JMXOBJ}",OffHeapSize])*100>{$GRIDGAIN.DATA.REGION.PUSED.MAX.HIGH}'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
graph_prototypes:
|
|
- uuid: f9410067b582451aa0b2675391504a65
|
|
name: 'Data region {#JMXNAME}: Checkpoint buffer utilization'
|
|
graph_items:
|
|
- drawtype: BOLD_LINE
|
|
color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CheckpointBufferSize]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",UsedCheckpointBufferSize]'
|
|
- uuid: 6f2ffd3ba45c4803864d049e7bfbbf18
|
|
name: 'Data region {#JMXNAME}: DataRegion utilization'
|
|
graph_items:
|
|
- drawtype: BOLD_LINE
|
|
color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",OffHeapSize]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",OffheapUsedSize]'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
- uuid: e7ad3e966ed94b91a88d28b785862b2f
|
|
name: 'Local node metrics'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=Kernal,name=ClusterLocalNodeMetricsMXBeanImpl,*"]'
|
|
delay: 30m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
item_prototypes:
|
|
- uuid: f3c7461902934de8a220513a33ad8771
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs active, current'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CurrentActiveJobs]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Number of currently active jobs concurrently executing on the node.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: job
|
|
- tag: component
|
|
value: node
|
|
- uuid: c254bc19bccb44de821c51b0882b78b4
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs cancelled, current'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CurrentCancelledJobs]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Number of cancelled jobs that are still running.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: job
|
|
- tag: component
|
|
value: node
|
|
- uuid: 63916bbee7604c3e9610f5989bc5bb7a
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: PME duration, current'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CurrentPmeDuration]'
|
|
history: 7d
|
|
units: ms
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Current PME duration in milliseconds.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: node
|
|
trigger_prototypes:
|
|
- uuid: a2672171fa374810b95b72f6014f3998
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CurrentPmeDuration],5m) > {$GRIDGAIN.PME.DURATION.MAX.HIGH}'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: PME duration is too long'
|
|
event_name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: PME duration is too long (over {$GRIDGAIN.PME.DURATION.MAX.HIGH} for 5 min)'
|
|
priority: HIGH
|
|
description: 'PME duration is over {$GRIDGAIN.PME.DURATION.MAX.HIGH}ms. Looks like PME is hung.'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: f21e1cee28354fcd945d58955831641b
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CurrentPmeDuration],5m) > {$GRIDGAIN.PME.DURATION.MAX.WARN}'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: PME duration is too long'
|
|
event_name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: PME duration is too long (over {$GRIDGAIN.PME.DURATION.MAX.WARN} for 5 min)'
|
|
priority: WARNING
|
|
description: 'PME duration is over {$GRIDGAIN.PME.DURATION.MAX.WARN}ms.'
|
|
dependencies:
|
|
- name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: PME duration is too long'
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CurrentPmeDuration],5m) > {$GRIDGAIN.PME.DURATION.MAX.HIGH}'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: 790e8c300f7c4c82b640fb6025bb9eef
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs rejected, current'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CurrentRejectedJobs]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Number of jobs rejected after the most recent collision resolution operation.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: job
|
|
- tag: component
|
|
value: node
|
|
- uuid: a5c1ece74c914620b9ce70c00c7d5377
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Threads count, current'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CurrentThreadCount]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Current number of live threads.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: node
|
|
- tag: component
|
|
value: threads
|
|
trigger_prototypes:
|
|
- uuid: 124c9738a384481fb39f5e8078cca0e4
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CurrentThreadCount],15m) > {$GRIDGAIN.THREADS.COUNT.MAX.WARN}'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Number of running threads is too high'
|
|
event_name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Number of running threads is too high (over {$GRIDGAIN.THREADS.COUNT.MAX.WARN} for 15 min)'
|
|
priority: WARNING
|
|
description: 'Number of running threads is over {$GRIDGAIN.THREADS.COUNT.MAX.WARN}.'
|
|
dependencies:
|
|
- name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: PME duration is too long'
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CurrentPmeDuration],5m) > {$GRIDGAIN.PME.DURATION.MAX.HIGH}'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: df386b29e8f74ec9a8f1825cb3094c0e
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs waiting, current'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CurrentWaitingJobs]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Number of queued jobs currently waiting to be executed.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: job
|
|
- tag: component
|
|
value: node
|
|
trigger_prototypes:
|
|
- uuid: 71d259fbdcd74888a4bedc646fc4bc54
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CurrentWaitingJobs],15m) > {$GRIDGAIN.JOBS.QUEUE.MAX.WARN}'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Number of queued jobs is too high'
|
|
event_name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Number of queued jobs is too high (over {$GRIDGAIN.JOBS.QUEUE.MAX.WARN} for 15 min)'
|
|
priority: WARNING
|
|
description: 'Number of queued jobs is over {$GRIDGAIN.JOBS.QUEUE.MAX.WARN}.'
|
|
tags:
|
|
- tag: scope
|
|
value: performance
|
|
- uuid: ec0c25c202ff4b1ea47422b51c24d3b4
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Heap memory used'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",HeapMemoryUsed]'
|
|
history: 7d
|
|
units: B
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Current heap size that is used for object allocation.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: memory
|
|
- tag: component
|
|
value: node
|
|
- uuid: a698da07a1794c479db9948a5ffb4123
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs cancelled, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TotalCancelledJobs]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Total number of jobs cancelled by the node per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: job
|
|
- tag: component
|
|
value: node
|
|
- uuid: 5a60a71ecd2d40af8ca2ca81712c287e
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs executed, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TotalExecutedJobs]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Total number of jobs handled by the node per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: job
|
|
- tag: component
|
|
value: node
|
|
- uuid: 7673741944094af9a6bc05bd630fd055
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs rejects, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TotalRejectedJobs]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Total number of jobs this node rejects during collision resolution operations since node startup per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: job
|
|
- tag: component
|
|
value: node
|
|
graph_prototypes:
|
|
- uuid: ca84e5c7fc76473392a30a3073e9cb25
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs current state'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CurrentActiveJobs]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CurrentWaitingJobs]'
|
|
- sortorder: '2'
|
|
color: 00611C
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CurrentRejectedJobs]'
|
|
- sortorder: '3'
|
|
color: F7941D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CurrentCancelledJobs]'
|
|
- uuid: 93e01a53b9054a83a6461e3526f63ee3
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs rate'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",TotalCancelledJobs]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",TotalRejectedJobs]'
|
|
- sortorder: '2'
|
|
color: 00611C
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",TotalExecutedJobs]'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- uuid: 5b7b9e010a274bb5a52784143dd57628
|
|
name: 'Cluster metrics'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=Kernal,name=ClusterMetricsMXBeanImpl,*"]'
|
|
delay: 30m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
item_prototypes:
|
|
- uuid: a7eb47fd5db24c198774beacf52fa965
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Nodes, Active baseline'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",ActiveBaselineNodes]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of nodes that are currently active in the baseline topology.'
|
|
preprocessing:
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: node
|
|
- uuid: 16ca4ca8efa04874902a619bce1f0071
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Nodes, Baseline'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TotalBaselineNodes]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Total baseline nodes that are registered in the baseline topology.'
|
|
preprocessing:
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: node
|
|
- uuid: cf66620eeb6b4c9d88c2bd69ed05685a
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Nodes, Client'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TotalClientNodes]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of client nodes in the cluster.'
|
|
preprocessing:
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: node
|
|
- uuid: d74b4324fb5a446a92e6fcf89162eff5
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Nodes, total'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TotalNodes]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Total number of nodes.'
|
|
preprocessing:
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: node
|
|
- uuid: b64a4ce1266b4806a554967d2fd24fa5
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Nodes, Server'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TotalServerNodes]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of server nodes in the cluster.'
|
|
preprocessing:
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: node
|
|
trigger_prototypes:
|
|
- uuid: bf1fbe1ea3754da59bd8a510fbcc6f54
|
|
expression: 'change(/GridGain by JMX/jmx["{#JMXOBJ}",TotalServerNodes])>0'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Server node added to the topology'
|
|
priority: INFO
|
|
description: 'One or more server nodes have been added to the topology. Acknowledge to close the problem manually.'
|
|
manual_close: 'YES'
|
|
tags:
|
|
- tag: scope
|
|
value: capacity
|
|
- uuid: db4cd7173ead4e878b79d55067d81300
|
|
expression: 'change(/GridGain by JMX/jmx["{#JMXOBJ}",TotalServerNodes])<0'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Server node left the topology'
|
|
priority: WARNING
|
|
description: 'One or more server nodes have left the topology. Acknowledge to close the problem manually.'
|
|
manual_close: 'YES'
|
|
tags:
|
|
- tag: scope
|
|
value: capacity
|
|
trigger_prototypes:
|
|
- uuid: ea93cb34b6434f2e94095c28087fc18e
|
|
expression: 'last(/GridGain by JMX/jmx["{#JMXOBJ}",TotalServerNodes])>last(/GridGain by JMX/jmx["{#JMXOBJ}",TotalBaselineNodes])'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: There are nodes is not in topology'
|
|
priority: INFO
|
|
description: 'The number of server nodes is greater than the number of baseline nodes, so one or more server nodes are not in the baseline topology. Acknowledge to close the problem manually.'
|
|
manual_close: 'YES'
|
|
tags:
|
|
- tag: scope
|
|
value: capacity
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- uuid: 3b81fbcbef204717be1918d3df919174
|
|
name: 'GridGain kernal metrics'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=Kernal,name=IgniteKernal,*"]'
|
|
delay: 30m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
item_prototypes:
|
|
- uuid: cbe7305a44754576a8084d606710765f
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Version'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",FullVersion]'
|
|
history: 7d
|
|
trends: '0'
|
|
value_type: CHAR
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Version of GridGain instance.'
|
|
preprocessing:
|
|
- type: REGEX
|
|
parameters:
|
|
- '(.*)-\d+'
|
|
- \1
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: kernal
|
|
trigger_prototypes:
|
|
- uuid: 4cc201fb67664fc49d36bbec95b574ce
|
|
expression: 'last(/GridGain by JMX/jmx["{#JMXOBJ}",FullVersion],#1)<>last(/GridGain by JMX/jmx["{#JMXOBJ}",FullVersion],#2) and length(last(/GridGain by JMX/jmx["{#JMXOBJ}",FullVersion]))>0'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Version has changed'
|
|
event_name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Version has changed (new version: {ITEM.VALUE})'
|
|
priority: INFO
|
|
description: 'The GridGain [{#JMXIGNITEINSTANCENAME}] version has changed. Acknowledge to close the problem manually.'
|
|
manual_close: 'YES'
|
|
tags:
|
|
- tag: scope
|
|
value: notice
|
|
- uuid: 18f518b41e804f7cb3eeaaf92fef40e7
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Local node ID'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeId]'
|
|
history: 7d
|
|
trends: '0'
|
|
value_type: CHAR
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Unique identifier for this node within grid.'
|
|
preprocessing:
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: kernal
|
|
- uuid: 4b3c99a88fbf4485a3dbf5efa2723ca7
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Uptime'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",UpTime]'
|
|
history: 7d
|
|
units: uptime
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Uptime of GridGain instance.'
|
|
preprocessing:
|
|
- type: MULTIPLIER
|
|
parameters:
|
|
- '0.001'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: kernal
|
|
trigger_prototypes:
|
|
- uuid: d7b2be3a707f49d2897e7cce356cafa5
|
|
expression: 'nodata(/GridGain by JMX/jmx["{#JMXOBJ}",UpTime],10m)=1'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Failed to fetch info data'
|
|
event_name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Failed to fetch info data (or no data for 10m)'
|
|
priority: WARNING
|
|
description: 'Zabbix has not received data for items for the last 10 minutes.'
|
|
manual_close: 'YES'
|
|
tags:
|
|
- tag: scope
|
|
value: availability
|
|
- uuid: 23cd9dbb498f4bb095ec8be1693fccf0
|
|
expression: 'last(/GridGain by JMX/jmx["{#JMXOBJ}",UpTime])<10m'
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: has been restarted'
|
|
event_name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: has been restarted (uptime < 10m)'
|
|
priority: INFO
|
|
description: 'Uptime is less than 10 minutes.'
|
|
manual_close: 'YES'
|
|
tags:
|
|
- tag: scope
|
|
value: notice
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- uuid: 6265d30cd7494809bc94f929968d3c6f
|
|
name: 'TCP Communication SPI metrics'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=SPIs,name=TcpCommunicationSpi,*"]'
|
|
delay: 30m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
item_prototypes:
|
|
- uuid: 904f0c843b1b434986043a63cb0890e7
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Communication outbound messages queue'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",OutboundMessagesQueueSize]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Outbound messages queue size.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: messages
|
|
- tag: component
|
|
value: network
|
|
- uuid: 2a01c4dc23b34df6801be0901bf10ab0
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Communication messages received, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",ReceivedMessagesCount]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '!msg/s'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of messages received per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: messages
|
|
- tag: component
|
|
value: network
|
|
- uuid: 613114b7abb94bd5bbabc2d1d19975b7
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Communication reconnect rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",ReconnectCount,maxNumbers]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Gets maximum number of reconnect attempts used when establishing connection with remote nodes per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: network
|
|
- uuid: e015293ddbb540e4b6b59ba6e28ed91e
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Communication messages sent, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",SentMessagesCount]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '!msg/s'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of messages sent per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: messages
|
|
- tag: component
|
|
value: network
|
|
graph_prototypes:
|
|
- uuid: ca090aa6d7e449e880b43cdbbd80d991
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Communication messages rate'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",SentMessagesCount]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",ReceivedMessagesCount]'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- uuid: 5fb38d8148d746d6ae19d4f8c5a33ce8
|
|
name: 'TCP discovery SPI'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=SPIs,name=TcpDiscoverySpi,*"]'
|
|
delay: 30m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
item_prototypes:
|
|
# Item prototype: UUID of the current cluster coordinator, read from the
# discovered TcpDiscoverySpi bean.
- uuid: 3e1086638d954e939907fd2009408048
  name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Coordinator'
  type: JMX
  key: 'jmx["{#JMXOBJ}",Coordinator]'
  history: 7d
  trends: '0'
  value_type: CHAR
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'Current coordinator UUID.'
  preprocessing:
    # Unchanged values are discarded, with a 3h heartbeat.
    - type: DISCARD_UNCHANGED_HEARTBEAT
      parameters:
        - 3h
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: network
  trigger_prototypes:
    # Fires when the two latest values differ and the latest one is non-empty.
    # Event name and description describe the coordinator change (they
    # previously carried "Version has changed" text from another trigger).
    - uuid: 40641263a3d840e89e46ba6f57076a0a
      expression: 'last(/GridGain by JMX/jmx["{#JMXOBJ}",Coordinator],#1)<>last(/GridGain by JMX/jmx["{#JMXOBJ}",Coordinator],#2) and length(last(/GridGain by JMX/jmx["{#JMXOBJ}",Coordinator]))>0'
      name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Coordinator has changed'
      event_name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Coordinator has changed (new coordinator: {ITEM.VALUE})'
      priority: WARNING
      description: 'The GridGain [{#JMXIGNITEINSTANCENAME}] coordinator has changed. Acknowledge to close the problem manually.'
      manual_close: 'YES'
      tags:
        - tag: scope
          value: notice
|
|
- uuid: 29d85d09951346c1a7c30acc83f404fc
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Discovery message worker queue'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",MessageWorkerQueueSize]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Message worker queue current size.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: messages
|
|
- tag: component
|
|
value: network
|
|
- uuid: 0aed9a4269ff4718aa443d1b053fa31b
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Nodes failed'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",NodesFailed]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Nodes failed count.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: network
|
|
- tag: component
|
|
value: nodes
|
|
- uuid: 43ea840b621e4f2a8643ca38479eb73e
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Nodes joined'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",NodesJoined]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Nodes join count.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: network
|
|
- tag: component
|
|
value: nodes
|
|
- uuid: 0164664362e446209b4399081d807ca7
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Nodes left'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",NodesLeft]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Nodes left count.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: network
|
|
- tag: component
|
|
value: nodes
|
|
- uuid: e03329689c674ea997d55d11e1a0c2be
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Discovery reconnect, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",ReconnectCount]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Number of times node tries to (re)establish connection to another node per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: network
|
|
- tag: component
|
|
value: nodes
|
|
# Item prototype: per-second rate of discovery messages processed
# (TotalProcessedMessages attribute of the discovered TcpDiscoverySpi bean).
- uuid: e344575b799a4f69b79b45ef6590a649
  name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Discovery messages processed, rate'
  type: JMX
  key: 'jmx["{#JMXOBJ}",TotalProcessedMessages]'
  history: 7d
  value_type: FLOAT
  units: '!msg/s'
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'The number of messages processed per second.'
  preprocessing:
    # Turns the raw counter into a per-second rate.
    - type: CHANGE_PER_SECOND
      parameters:
        - ''
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: messages
    - tag: component
      value: network
|
|
# Item prototype: per-second rate of discovery messages received
# (TotalReceivedMessages attribute of the discovered TcpDiscoverySpi bean).
- uuid: adcf2c5981004c8da658122cc50a6518
  name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Discovery messages received, rate'
  type: JMX
  key: 'jmx["{#JMXOBJ}",TotalReceivedMessages]'
  history: 7d
  value_type: FLOAT
  units: '!msg/s'
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'The number of messages received per second.'
  preprocessing:
    # Turns the raw counter into a per-second rate.
    - type: CHANGE_PER_SECOND
      parameters:
        - ''
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: messages
    - tag: component
      value: network
|
|
graph_prototypes:
|
|
- uuid: a44983a855934d3ea5d2eaa1421df147
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Discovery messages rate'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",TotalProcessedMessages]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",TotalReceivedMessages]'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- uuid: b0b570121f1646e5baf0b0ff5cc5de2b
|
|
name: 'Transaction metrics'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=TransactionMetrics,name=TransactionMetricsMxBeanImpl,*"]'
|
|
delay: 30m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
item_prototypes:
|
|
- uuid: 0b03ef7787684ab5abd99af4610adf59
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Locked keys'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",LockedKeysNumber]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of keys locked on the node.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: transactions
|
|
- uuid: 446cbb708d354b2a9282e973d562527f
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Transactions owner, current'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",OwnerTransactionsNumber]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of active transactions for which this node is the initiator.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: transactions
|
|
# Item prototype: rate of committed transactions
# (TransactionsCommittedNumber attribute of the transaction metrics bean).
- uuid: 21971cbf540c48df93fde079ce917a26
  name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Transactions committed, rate'
  type: JMX
  key: 'jmx["{#JMXOBJ}",TransactionsCommittedNumber]'
  history: 7d
  value_type: FLOAT
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'The number of transactions which were committed per second.'
  preprocessing:
    # The item is named and described as a per-second rate and stored as
    # FLOAT, so the raw counter is converted like the other rate items.
    # NOTE(review): assumes the attribute is a cumulative counter - confirm.
    - type: CHANGE_PER_SECOND
      parameters:
        - ''
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: transactions
|
|
- uuid: d8d3e05c6e7e4874b3149edb74774e6d
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Transactions holding lock, current'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",TransactionsHoldingLockNumber]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of active transactions holding at least one key lock.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: transactions
|
|
# Item prototype: rate of rolled-back transactions
# (TransactionsRolledBackNumber attribute of the transaction metrics bean).
- uuid: 2d1def1d4f414ce992cf5a6ff1bc4204
  name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Transactions rolledback, rate'
  type: JMX
  key: 'jmx["{#JMXOBJ}",TransactionsRolledBackNumber]'
  history: 7d
  value_type: FLOAT
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'The number of transactions which were rollback per second.'
  preprocessing:
    # The item is named and described as a per-second rate and stored as
    # FLOAT, so the raw counter is converted like the other rate items.
    # NOTE(review): assumes the attribute is a cumulative counter - confirm.
    - type: CHANGE_PER_SECOND
      parameters:
        - ''
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: transactions
|
|
graph_prototypes:
|
|
- uuid: 82d772972cec4454b95d69343040b2b5
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Transactions'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",OwnerTransactionsNumber]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",TransactionsHoldingLockNumber]'
|
|
- uuid: ad74079d5ef741918d25f059c1950839
|
|
name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Transactions rate'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",TransactionsRolledBackNumber]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",TransactionsCommittedNumber]'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- uuid: 7e3825aba1ad47c194162122eb050612
|
|
name: 'Cache groups'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=\"Cache groups\",*"]'
|
|
delay: 10m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
filter:
|
|
evaltype: AND
|
|
conditions:
|
|
- macro: '{#JMXNAME}'
|
|
value: '{$GRIDGAIN.LLD.FILTER.CACHE.MATCHES}'
|
|
formulaid: A
|
|
- macro: '{#JMXNAME}'
|
|
value: '{$GRIDGAIN.LLD.FILTER.CACHE.NOT_MATCHES}'
|
|
operator: NOT_MATCHES_REGEX
|
|
formulaid: B
|
|
item_prototypes:
|
|
- uuid: d46bf088d33946a69a5b625566558994
|
|
name: 'Cache group [{#JMXNAME}]: Backups'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",Backups]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Count of backups configured for cache group.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache_group
|
|
# Item prototype: list of caches belonging to the discovered cache group.
- uuid: a535d161527b4821b717f114aaeb8b0b
  name: 'Cache group [{#JMXNAME}]: Caches'
  type: JMX
  key: 'jmx["{#JMXOBJ}",Caches]'
  history: 7d
  trends: '0'
  value_type: CHAR
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'List of caches.'
  preprocessing:
    # Unchanged values are discarded, with a 3h heartbeat.
    - type: DISCARD_UNCHANGED_HEARTBEAT
      parameters:
        - 3h
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: cache_group
  trigger_prototypes:
    # Fires when the two latest values differ and the latest one is non-empty.
    # The event name matches the trigger name (it previously said
    # "Version has changed", text copied from another trigger).
    - uuid: 94d82f9db4f449e491782e14f6973f9b
      expression: 'last(/GridGain by JMX/jmx["{#JMXOBJ}",Caches],#1)<>last(/GridGain by JMX/jmx["{#JMXOBJ}",Caches],#2) and length(last(/GridGain by JMX/jmx["{#JMXOBJ}",Caches]))>0'
      name: 'Cache group [{#JMXNAME}]: List of caches has changed'
      event_name: 'Cache group [{#JMXNAME}]: List of caches has changed (new value: {ITEM.VALUE})'
      priority: INFO
      description: 'List of caches has changed. Significant changes have occurred in the cluster. Acknowledge to close the problem manually.'
      manual_close: 'YES'
      tags:
        - tag: scope
          value: notice
|
|
- uuid: 0a09c18adfd5477098684c47927f967b
|
|
name: 'Cache group [{#JMXNAME}]: Local node partitions, moving'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeMovingPartitionsCount]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Count of partitions with state MOVING for this cache group located on this node.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache_group
|
|
trigger_prototypes:
|
|
- uuid: 84e1402b3ae64960ad997d2610137927
|
|
expression: 'max(/GridGain by JMX/jmx["{#JMXOBJ}",LocalNodeMovingPartitionsCount],30m)>0'
|
|
name: 'Cache group [{#JMXNAME}]: Rebalance in progress'
|
|
priority: INFO
|
|
description: 'Acknowledge to close the problem manually.'
|
|
manual_close: 'YES'
|
|
tags:
|
|
- tag: scope
|
|
value: notice
|
|
- uuid: c2a38de3743549e0850e678d1f91e2de
|
|
name: 'Cache group [{#JMXNAME}]: Local node partitions, owning'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeOwningPartitionsCount]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Count of partitions with state OWNING for this cache group located on this node.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache_group
|
|
- uuid: be9b2cbf210e4e27a5887d77f2dafaad
|
|
name: 'Cache group [{#JMXNAME}]: Local node entries, renting'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeRentingEntriesCount]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Count of entries remains to evict in RENTING partitions located on this node for this cache group.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache_group
|
|
- uuid: 582acb454ffa4b129f5786e814df234f
|
|
name: 'Cache group [{#JMXNAME}]: Local node partitions, renting'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeRentingPartitionsCount]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Count of partitions with state RENTING for this cache group located on this node.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache_group
|
|
- uuid: e026169754954bbe85afcef2534b4d0e
|
|
name: 'Cache group [{#JMXNAME}]: Partition copies, max'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",MaximumNumberOfPartitionCopies]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Maximum number of partition copies for all partitions of this cache group.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache_group
|
|
- uuid: b93a9ff86a2048bfbf8743b7a1c5ec06
|
|
name: 'Cache group [{#JMXNAME}]: Partition copies, min'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",MinimumNumberOfPartitionCopies]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Minimum number of partition copies for all partitions of this cache group.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache_group
|
|
trigger_prototypes:
|
|
- uuid: 63c244c02ace4ac4a8d6f60e5c533890
|
|
expression: 'max(/GridGain by JMX/jmx["{#JMXOBJ}",MinimumNumberOfPartitionCopies],30m)=0'
|
|
name: 'Cache group [{#JMXNAME}]: There is no copy for partitions'
|
|
priority: WARNING
|
|
tags:
|
|
- tag: scope
|
|
value: capacity
|
|
- uuid: 8dac4ccaad0f4736b2065e2f1200e3ff
|
|
name: 'Cache group [{#JMXNAME}]: Partitions'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",Partitions]'
|
|
history: 7d
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Count of partitions for cache group.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache_group
|
|
trigger_prototypes:
|
|
- uuid: 3ded54fcdad74c83b47543410a7d9b3c
|
|
expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",Backups],5m)>=max(/GridGain by JMX/jmx["{#JMXOBJ}",MinimumNumberOfPartitionCopies],5m)'
|
|
name: 'Cache group [{#JMXNAME}]: One or more backups are unavailable'
|
|
priority: WARNING
|
|
tags:
|
|
- tag: scope
|
|
value: capacity
|
|
graph_prototypes:
|
|
- uuid: da32480debef4e2baec58a7cf1131357
|
|
name: 'Cache group [{#JMXNAME}]: Partitions'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeMovingPartitionsCount]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeRentingPartitionsCount]'
|
|
- sortorder: '2'
|
|
color: 00611C
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeOwningPartitionsCount]'
|
|
- sortorder: '3'
|
|
color: F7941D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",LocalNodeRentingEntriesCount]'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
- uuid: 3ca6cce698d247daae252430289e7b61
|
|
name: 'Thread pool metrics'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:group=\"Thread Pools\",*"]'
|
|
delay: 10m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
filter:
|
|
evaltype: AND
|
|
conditions:
|
|
- macro: '{#JMXNAME}'
|
|
value: '{$GRIDGAIN.LLD.FILTER.THREAD.POOL.MATCHES}'
|
|
formulaid: A
|
|
- macro: '{#JMXNAME}'
|
|
value: '{$GRIDGAIN.LLD.FILTER.THREAD.POOL.NOT_MATCHES}'
|
|
operator: NOT_MATCHES_REGEX
|
|
formulaid: B
|
|
item_prototypes:
|
|
# Item prototype: core number of threads of the discovered thread pool.
- uuid: 7d6ab6a7180c44859b933784fb565212
  name: 'Thread pool [{#JMXNAME}]: Pool size, core'
  type: JMX
  key: 'jmx["{#JMXOBJ}",CorePoolSize]'
  history: 7d
  units: '!msg'
  # Uses the GRIDGAIN user macro, paired with {$GRIDGAIN.PASSWORD} below
  # (was {$IGNITE.USER}, which no other item in this template uses).
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'The core number of threads.'
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: thread_pool
|
|
# Item prototype: maximum allowed number of threads of the discovered thread pool.
- uuid: 3ffebf40ed154a7eb7050e16d30f9f53
  name: 'Thread pool [{#JMXNAME}]: Pool size, max'
  type: JMX
  key: 'jmx["{#JMXOBJ}",MaximumPoolSize]'
  history: 7d
  units: '!msg'
  # Uses the GRIDGAIN user macro, paired with {$GRIDGAIN.PASSWORD} below
  # (was {$IGNITE.USER}, which no other item in this template uses).
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'The maximum allowed number of threads.'
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: thread_pool
|
|
# Item prototype: current number of threads in the discovered thread pool.
- uuid: 1f7f5e0d19f6400fa8803eba2fb14f85
  name: 'Thread pool [{#JMXNAME}]: Pool size'
  type: JMX
  key: 'jmx["{#JMXOBJ}",PoolSize]'
  history: 7d
  units: '!msg'
  # Uses the GRIDGAIN user macro, paired with {$GRIDGAIN.PASSWORD} below
  # (was {$IGNITE.USER}, which no other item in this template uses).
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'Current number of threads in the pool.'
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: thread_pool
|
|
# Item prototype: current size of the execution queue of the discovered thread pool.
- uuid: c4a5e348590341b29af96b57bf92240b
  name: 'Thread pool [{#JMXNAME}]: Queue size'
  type: JMX
  key: 'jmx["{#JMXOBJ}",QueueSize]'
  history: 7d
  units: '!msg'
  # Uses the GRIDGAIN user macro, paired with {$GRIDGAIN.PASSWORD} below
  # (was {$IGNITE.USER}, which no other item in this template uses).
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'Current size of the execution queue.'
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: thread_pool
  trigger_prototypes:
    # Fires when the queue size stayed above the per-pool threshold macro
    # for the whole 5-minute window.
    - uuid: f2a7aa098ed245f48b455ed747ee42c3
      expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",QueueSize],5m) > {$GRIDGAIN.THREAD.QUEUE.MAX.WARN:"{#JMXNAME}"}'
      name: 'Thread pool [{#JMXNAME}]: Too many messages in queue'
      event_name: 'Thread pool [{#JMXNAME}]: Too many messages in queue (over {$GRIDGAIN.THREAD.QUEUE.MAX.WARN:"{#JMXNAME}"} for 5 min)'
      priority: AVERAGE
      description: 'Number of messages in queue more than {$GRIDGAIN.THREAD.QUEUE.MAX.WARN:"{#JMXNAME}"}.'
      tags:
        - tag: scope
          value: performance
|
|
graph_prototypes:
|
|
- uuid: d3db21cd80664dc4b6847456e15b2b3e
|
|
name: 'Thread pool [{#JMXNAME}]: Thread pool size'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",PoolSize]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",MaximumPoolSize]'
|
|
- sortorder: '2'
|
|
color: 00611C
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CorePoolSize]'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
preprocessing:
|
|
- type: JAVASCRIPT
|
|
parameters:
|
|
- |
|
|
var data = JSON.parse(value);
|
|
for (var item, i = 0; item = data.data[i++];) {
|
|
if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
|
|
Object.assign(item, {
|
|
'{#JMXIGNITEINSTANCENAME}': 'null'
|
|
});
|
|
}
|
|
|
|
}
|
|
|
|
return JSON.stringify(data)
|
|
- type: DISCARD_UNCHANGED_HEARTBEAT
|
|
parameters:
|
|
- 3h
|
|
- uuid: 3f3382c27cc449bd86822c245b798056
|
|
name: 'Cache metrics'
|
|
type: JMX
|
|
key: 'jmx.discovery[beans,"org.apache:name=\"org.apache.gridgain.internal.processors.cache.CacheLocalMetricsMXBeanImpl\",*"]'
|
|
delay: 10m
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
filter:
|
|
evaltype: AND
|
|
conditions:
|
|
- macro: '{#JMXGROUP}'
|
|
value: '{$GRIDGAIN.LLD.FILTER.CACHE.MATCHES}'
|
|
formulaid: A
|
|
- macro: '{#JMXGROUP}'
|
|
value: '{$GRIDGAIN.LLD.FILTER.CACHE.NOT_MATCHES}'
|
|
operator: NOT_MATCHES_REGEX
|
|
formulaid: B
|
|
item_prototypes:
|
|
- uuid: 6fb5dee0c7434b279eb21da7d54edacc
|
|
name: 'Cache group [{#JMXGROUP}]: Cache gets, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CacheGets]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: ops
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of gets to the cache per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache
|
|
- uuid: 632a331fe886428fa7b2c8845a02b57a
|
|
name: 'Cache group [{#JMXGROUP}]: Cache hits, pct'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CacheHitPercentage]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '%'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Percentage of successful hits.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache
|
|
- uuid: 843b31df2e4d430082731b44e2653f13
|
|
name: 'Cache group [{#JMXGROUP}]: Cache misses, pct'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CacheMissPercentage]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '%'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'Percentage of accesses that failed to find anything.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache
|
|
- uuid: 96616d8c2b9c46b0bbd7350679476c36
|
|
name: 'Cache group [{#JMXGROUP}]: Cache puts, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CachePuts]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: ops
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of puts to the cache per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache
|
|
- uuid: 308b3e27d35b439bbb2c1cf96f6d92fe
|
|
name: 'Cache group [{#JMXGROUP}]: Cache removals, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CacheRemovals]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: ops
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of removals from the cache per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache
|
|
- uuid: e4886d5b699e432c8e6bb47b23b9c314
|
|
name: 'Cache group [{#JMXGROUP}]: Cache size'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CacheSize]'
|
|
history: 7d
|
|
units: '!keys'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of non-null values in the cache as a long value.'
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache
|
|
- uuid: 304ff6af92c0473aab8216d16509d28f
|
|
name: 'Cache group [{#JMXGROUP}]: Cache transaction commits, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CacheTxCommits]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '!tps'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of transaction commits per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache
|
|
- uuid: bd5b517d5a384c70a070658bc41734bf
|
|
name: 'Cache group [{#JMXGROUP}]: Cache transaction rollbacks, rate'
|
|
type: JMX
|
|
key: 'jmx["{#JMXOBJ}",CacheTxRollbacks]'
|
|
history: 7d
|
|
value_type: FLOAT
|
|
units: '!tps'
|
|
username: '{$GRIDGAIN.USER}'
|
|
password: '{$GRIDGAIN.PASSWORD}'
|
|
description: 'The number of transaction rollback per second.'
|
|
preprocessing:
|
|
- type: CHANGE_PER_SECOND
|
|
parameters:
|
|
- ''
|
|
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
|
|
tags:
|
|
- tag: component
|
|
value: cache
|
|
# Item prototype: number of cache entries held in heap memory.
# Stored as an absolute count: the former CHANGE_PER_SECOND step was removed
# because the item is described as a count (units "!keys") and the
# "All entries are in heap" trigger compares it directly with CacheSize.
- uuid: a0d3a73939564dc39267ccdca06d524b
  name: 'Cache group [{#JMXGROUP}]: Cache heap entries'
  type: JMX
  key: 'jmx["{#JMXOBJ}",HeapEntriesCount]'
  history: 7d
  units: '!keys'
  username: '{$GRIDGAIN.USER}'
  password: '{$GRIDGAIN.PASSWORD}'
  description: 'The number of entries in heap memory.'
  jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
  tags:
    - tag: component
      value: cache
  trigger_prototypes:
    # Latest cache size equals latest heap entry count.
    - uuid: cfe03901890a4377ad8d5dcc7be3e0c5
      expression: 'last(/GridGain by JMX/jmx["{#JMXOBJ}",CacheSize])=last(/GridGain by JMX/jmx["{#JMXOBJ}",HeapEntriesCount])'
      name: 'Cache group [{#JMXGROUP}]: All entries are in heap'
      priority: INFO
      description: 'All entries are in heap. Possibly you use eager queries it may cause out of memory exceptions for big caches. Acknowledge to close the problem manually.'
      manual_close: 'YES'
      tags:
        - tag: scope
          value: notice
    # Rollback rate stayed above commit rate for 5 minutes; depends on the
    # "no success transactions" trigger defined after it.
    - uuid: 1c990b38154340a3aab678ac1365cf7e
      expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CacheTxRollbacks],5m) > max(/GridGain by JMX/jmx["{#JMXOBJ}",CacheTxCommits],5m)'
      name: 'Cache group [{#JMXGROUP}]: Success transactions less than rollbacks for 5m'
      priority: WARNING
      dependencies:
        - name: 'Cache group [{#JMXGROUP}]: There are no success transactions for cache for 5m'
          expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CacheTxRollbacks],5m)>0 and max(/GridGain by JMX/jmx["{#JMXOBJ}",CacheTxCommits],5m)=0'
      tags:
        - tag: scope
          value: performance
    # Rollbacks occurred throughout the last 5 minutes while no commits did.
    - uuid: 2caa406da4cf4d089705e5506fd589f1
      expression: 'min(/GridGain by JMX/jmx["{#JMXOBJ}",CacheTxRollbacks],5m)>0 and max(/GridGain by JMX/jmx["{#JMXOBJ}",CacheTxCommits],5m)=0'
      name: 'Cache group [{#JMXGROUP}]: There are no success transactions for cache for 5m'
      priority: AVERAGE
      tags:
        - tag: scope
          value: performance
|
|
graph_prototypes:
|
|
- uuid: 8c453a6631b34c96b39375aff2e51ac3
|
|
name: 'Cache group [{#JMXGROUP}]: Cache hits'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CacheHitPercentage]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CacheMissPercentage]'
|
|
- uuid: de80d7645ec347c3a547e9d8d41edc3a
|
|
name: 'Cache group [{#JMXGROUP}]: Cache ops'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CacheGets]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CachePuts]'
|
|
- sortorder: '2'
|
|
color: 00611C
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CacheRemovals]'
|
|
- uuid: 20b825d52d8241a79405768faf0e202d
|
|
name: 'Cache group [{#JMXGROUP}]: Cache transactions'
|
|
graph_items:
|
|
- color: 199C0D
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CacheTxCommits]'
|
|
- sortorder: '1'
|
|
color: F63100
|
|
item:
|
|
host: 'GridGain by JMX'
|
|
key: 'jmx["{#JMXOBJ}",CacheTxRollbacks]'
|
|
# JMX service URL; address and port come from {HOST.CONN} and {HOST.PORT}.
jmx_endpoint: 'service:jmx:rmi:///jndi/rmi://{HOST.CONN}:{HOST.PORT}/jmxrmi'
preprocessing:
  # The script parses the incoming value as JSON, walks the entries of
  # `data.data`, and adds '{#JMXIGNITEINSTANCENAME}' with the string 'null'
  # to each entry that lacks that key. It returns the re-serialized JSON.
  - type: JAVASCRIPT
    parameters:
      - |
        var data = JSON.parse(value);
        for (var item, i = 0; item = data.data[i++];) {
          if (!('{#JMXIGNITEINSTANCENAME}' in item)) {
            Object.assign(item, {
              '{#JMXIGNITEINSTANCENAME}': 'null'
            });
          }

        }

        return JSON.stringify(data)
  # Discard-unchanged-with-heartbeat step; its single parameter is 3h.
  - type: DISCARD_UNCHANGED_HEARTBEAT
    parameters:
      - 3h
# Tag/value pairs: class=software, target=gridgain.
tags:
  - tag: class
    value: software
  - tag: target
    value: gridgain
# User macros with their default values. Each `description` states the
# macro's purpose; {$GRIDGAIN.PASSWORD} and {$GRIDGAIN.USER} carry none.
macros:
  # Trigger thresholds: checkpoint buffer, data region and job queue.
  - macro: '{$GRIDGAIN.CHECKPOINT.PUSED.MAX.HIGH}'
    value: '80'
    description: 'The maximum percent of checkpoint buffer utilization for high trigger expression.'
  - macro: '{$GRIDGAIN.CHECKPOINT.PUSED.MAX.WARN}'
    value: '66'
    description: 'The maximum percent of checkpoint buffer utilization for warning trigger expression.'
  - macro: '{$GRIDGAIN.DATA.REGION.PUSED.MAX.HIGH}'
    value: '90'
    description: 'The maximum percent of data region utilization for high trigger expression.'
  - macro: '{$GRIDGAIN.DATA.REGION.PUSED.MAX.WARN}'
    value: '80'
    description: 'The maximum percent of data region utilization for warning trigger expression.'
  - macro: '{$GRIDGAIN.JOBS.QUEUE.MAX.WARN}'
    value: '10'
    description: 'The maximum number of queued jobs for trigger expression.'
  # Low-level discovery filters (MATCHES / NOT_MATCHES pairs).
  - macro: '{$GRIDGAIN.LLD.FILTER.CACHE.MATCHES}'
    value: '.*'
    description: 'Filter of discoverable cache groups.'
  - macro: '{$GRIDGAIN.LLD.FILTER.CACHE.NOT_MATCHES}'
    value: CHANGE_IF_NEEDED
    description: 'Filter to exclude discovered cache groups.'
  - macro: '{$GRIDGAIN.LLD.FILTER.DATA.REGION.MATCHES}'
    value: '.*'
    description: 'Filter of discoverable data regions.'
  - macro: '{$GRIDGAIN.LLD.FILTER.DATA.REGION.NOT_MATCHES}'
    value: ^(sysMemPlc|TxLog)$
    description: 'Filter to exclude discovered data regions.'
  - macro: '{$GRIDGAIN.LLD.FILTER.THREAD.POOL.MATCHES}'
    value: '.*'
    description: 'Filter of discoverable thread pools.'
  - macro: '{$GRIDGAIN.LLD.FILTER.THREAD.POOL.NOT_MATCHES}'
    value: ^(GridCallbackExecutor|GridRebalanceStripedExecutor|GridDataStreamExecutor|StripedExecutor)$
    description: 'Filter to exclude discovered thread pools.'
  # The value below is a placeholder string, not a usable credential.
  - macro: '{$GRIDGAIN.PASSWORD}'
    value: '<secret>'
  # PME duration and thread thresholds.
  - macro: '{$GRIDGAIN.PME.DURATION.MAX.HIGH}'
    value: '60000'
    description: 'The maximum PME duration in ms for high trigger expression.'
  - macro: '{$GRIDGAIN.PME.DURATION.MAX.WARN}'
    value: '10000'
    description: 'The maximum PME duration in ms for warning trigger expression.'
  - macro: '{$GRIDGAIN.THREAD.QUEUE.MAX.WARN}'
    value: '1000'
    description: 'Threshold for thread pool queue size. Can be used with thread pool name as context.'
  - macro: '{$GRIDGAIN.THREADS.COUNT.MAX.WARN}'
    value: '1000'
    description: 'The maximum number of running threads for trigger expression.'
  - macro: '{$GRIDGAIN.USER}'
    value: zabbix
dashboards:
|
|
- uuid: 407c505abde6457b88154f6d566190d8
|
|
name: 'GridGain: Overview'
|
|
pages:
|
|
- name: General
|
|
widgets:
|
|
# Graph-prototype widget, width 24 and height 5, with no explicit 'y'.
# Fields set columns=2, rows=1 and select the "Transactions rate" graph
# prototype on the 'GridGain by JMX' host.
- type: graphprototype
  width: '24'
  height: '5'
  fields:
    - type: INTEGER
      name: columns
      value: '2'
    - type: INTEGER
      name: rows
      value: '1'
    - type: GRAPH_PROTOTYPE
      name: graphid
      value:
        host: 'GridGain by JMX'
        name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Transactions rate'
# Graph-prototype widget at 'y' 5, width 24 and height 5.
# Fields set columns=2, rows=1 and select the "Discovery messages rate"
# graph prototype on the 'GridGain by JMX' host.
- type: graphprototype
  # The key is quoted so it stays the string "y" (bare y reads as a boolean
  # under YAML 1.1).
  'y': '5'
  width: '24'
  height: '5'
  fields:
    - type: INTEGER
      name: columns
      value: '2'
    - type: INTEGER
      name: rows
      value: '1'
    - type: GRAPH_PROTOTYPE
      name: graphid
      value:
        host: 'GridGain by JMX'
        name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Discovery messages rate'
# Graph-prototype widget at 'y' 10, width 24 and height 5.
# Fields set columns=2, rows=1 and select the "Communication messages rate"
# graph prototype on the 'GridGain by JMX' host.
- type: graphprototype
  # The key is quoted so it stays the string "y" (bare y reads as a boolean
  # under YAML 1.1).
  'y': '10'
  width: '24'
  height: '5'
  fields:
    - type: INTEGER
      name: columns
      value: '2'
    - type: INTEGER
      name: rows
      value: '1'
    - type: GRAPH_PROTOTYPE
      name: graphid
      value:
        host: 'GridGain by JMX'
        name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Communication messages rate'
# Graph-prototype widget at 'y' 15, width 24 and height 5.
# Fields set columns=2, rows=1 and select the "Jobs rate" graph prototype
# on the 'GridGain by JMX' host.
- type: graphprototype
  # The key is quoted so it stays the string "y" (bare y reads as a boolean
  # under YAML 1.1).
  'y': '15'
  width: '24'
  height: '5'
  fields:
    - type: INTEGER
      name: columns
      value: '2'
    - type: INTEGER
      name: rows
      value: '1'
    - type: GRAPH_PROTOTYPE
      name: graphid
      value:
        host: 'GridGain by JMX'
        name: 'GridGain [{#JMXIGNITEINSTANCENAME}]: Jobs rate'