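# NOTE(review): the lines below are repository web-viewer residue captured
# together with the file; they are not part of the Zabbix template.
# You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
#
# 903 lines
# 40 KiB
#
# 1 year ago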
# Zabbix template export: 'SMART by Zabbix agent 2' (export format version 7.0).
# Layout: one LLD rule ('Disk discovery') whose item prototypes are all
# dependent items of the master item smart.disk.get[{#PATH},"{#RAIDTYPE}"],
# plus template-level tags, user macros and a two-page dashboard.
# NOTE(review): indentation was reconstructed from the Zabbix export schema;
# blank lines inside block-scalar descriptions may have been lost upstream.
zabbix_export:
  version: '7.0'
  template_groups:
    - uuid: e960332b3f6c46a1956486d4f3f99fce
      name: 'Templates/Server hardware'
  templates:
    - uuid: 7b6c6228b25f4586b42cd1bf37ff8034
      template: 'SMART by Zabbix agent 2'
      name: 'SMART by Zabbix agent 2'
      description: |
        The template for monitoring S.M.A.R.T. attributes of physical disk that works without any external scripts. It collects metrics by Zabbix agent 2 version 5.0 and later with Smartmontools version 7.1 and later. Disk discovery LLD rule finds all HDD, SSD, NVMe disks with S.M.A.R.T. enabled. Attribute discovery LLD rule have pre-defined Vendor Specific Attributes for each disk, and will be discovered if attribute is present.
        You can discuss this template or leave feedback on our forum https://www.zabbix.com/forum/zabbix-suggestions-and-feedback/415662-discussion-thread-for-official-zabbix-smart-disk-monitoring
        Generated by official Zabbix template tool "Templator" 2.0.0
      vendor:
        name: Zabbix
        version: 7.0-0
      groups:
        - name: 'Templates/Server hardware'
      discovery_rules:
        - uuid: 4575af2717ec4bf78645edb84a966c84
          name: 'Disk discovery'
          key: smart.disk.discovery
          delay: 1h
          # A disk is kept only if {#NAME} satisfies both conditions (evaltype AND):
          # condition A against {$SMART.DISK.NAME.MATCHES} and
          # condition B (NOT_MATCHES_REGEX) against {$SMART.DISK.NAME.NOT_MATCHES}.
          filter:
            evaltype: AND
            conditions:
              - macro: '{#NAME}'
                value: '{$SMART.DISK.NAME.MATCHES}'
                formulaid: A
              - macro: '{#NAME}'
                value: '{$SMART.DISK.NAME.NOT_MATCHES}'
                operator: NOT_MATCHES_REGEX
                formulaid: B
          description: 'Discovery SMART disks.'
          item_prototypes:
            # Attribute items (smart.disk.attribute.*) carry discover: NO_DISCOVER;
            # the same-named entries in `overrides` below set discover: DISCOVER
            # for them when {#ATTRIBUTES} matches the attribute name.
            - uuid: 643de316ae644f6d8fd92d1f03ae0360
              name: 'SMART [{#NAME}]: Bad_Block_Rate'
              type: DEPENDENT
              key: 'smart.disk.attribute.bad_block_rate[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'Percentage of used reserve blocks divided by total reserve blocks.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.bad_block_rate.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: 2a055383835247bc83745c84fdc5dea9
              name: 'SMART [{#NAME}]: Power_Cycle_Count'
              type: DEPENDENT
              key: 'smart.disk.attribute.power_cycle_count[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'This attribute indicates the count of full hard disk power on/off cycles.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.power_cycle_count.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: e1fbae7fe66c453997d9aa6e6eb3b5cb
              name: 'SMART [{#NAME}]: Program_Fail_Count_Chip'
              type: DEPENDENT
              key: 'smart.disk.attribute.program_fail_count_chip[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'The total number of flash program operation failures since the drive was deployed.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.program_fail_count_chip.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: abb098035cbd4c5b9e2d15c1e95d8e34
              name: 'SMART [{#NAME}]: Raw_Read_Error_Rate'
              type: DEPENDENT
              key: 'smart.disk.attribute.raw_read_error_rate[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'Stores data related to the rate of hardware read errors that occurred when reading data from a disk surface. The raw value has different structure for different vendors and is often not meaningful as a decimal number. For some drives, this number may increase during normal operation without necessarily signifying errors.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.raw_read_error_rate.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: 5601bfa6a38940b6b8d695bf029f534c
              name: 'SMART [{#NAME}]: Reallocated_Sector_Ct'
              type: DEPENDENT
              key: 'smart.disk.attribute.reallocated_sector_ct[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'Disk discovered attribute.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.reallocated_sector_ct.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: f538f4708280451eb30d20433d133012
              name: 'SMART [{#NAME}]: Reported_Uncorrect'
              type: DEPENDENT
              key: 'smart.disk.attribute.reported_uncorrect[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'The count of errors that could not be recovered using hardware ECC.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.reported_uncorrect.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: 70ac7d6cdf29431cacf02fc716c8ab0c
              name: 'SMART [{#NAME}]: Seek_Error_Rate'
              type: DEPENDENT
              key: 'smart.disk.attribute.seek_error_rate[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'Rate of seek errors of the magnetic heads. If there is a partial failure in the mechanical positioning system, then seek errors will arise. Such a failure may be due to numerous factors, such as damage to a servo, or thermal widening of the hard disk. The raw value has different structure for different vendors and is often not meaningful as a decimal number. For some drives, this number may increase during normal operation without necessarily signifying errors.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.seek_error_rate.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: 6e08c65d77ca4155b396c9615b2f45b3
              name: 'SMART [{#NAME}]: Spin_Up_Time'
              type: DEPENDENT
              key: 'smart.disk.attribute.spin_up_time[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'Average time of spindle spin up (from zero RPM to fully operational [milliseconds]).'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.spin_up_time.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: e428eb3368e94dbc955f2bebf8feb202
              name: 'SMART [{#NAME}]: Start_Stop_Count'
              type: DEPENDENT
              key: 'smart.disk.attribute.start_stop_count[{#NAME}]'
              delay: '0'
              history: 7d
              discover: NO_DISCOVER
              description: 'A tally of spindle start/stop cycles. The spindle turns on, and hence the count is increased, both when the hard disk is turned on after having before been turned entirely off (disconnected from power source) and when the hard disk returns from having previously been put to sleep mode.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.start_stop_count.value
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: attribute
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            # Items below have no `discover` key of their own; the 'Self-test' and
            # 'Not NVMe' overrides switch some of them off by item-name match.
            - uuid: c186f7ce1b8d4311997c84fd5c239819
              name: 'SMART [{#NAME}]: Critical warning'
              type: DEPENDENT
              key: 'smart.disk.critical_warning[{#NAME}]'
              delay: '0'
              history: 7d
              description: 'This field indicates critical warnings for the state of the controller.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.critical_warning
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: 72f16a701cee4119b0b1865671fd448d
              name: 'SMART [{#NAME}]: Smartctl error'
              type: DEPENDENT
              key: 'smart.disk.error[{#NAME}]'
              delay: '0'
              history: 7d
              trends: '0'
              value_type: TEXT
              description: 'This metric will contain smartctl errors.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.error
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 1h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: 849a9d5c9b9d4b969a09ab5cf4629ded
              name: 'SMART [{#NAME}]: Exit status'
              type: DEPENDENT
              key: 'smart.disk.es[{#NAME}]'
              delay: '0'
              history: 7d
              description: |
                The exit statuses of smartctl are defined by a bitmask but in decimal value. The eight different bits in the exit status have the following meanings for ATA disks; some of these values may also be returned for SCSI disks.
                Bit 0: Command line did not parse.
                Bit 1: Device open failed, device did not return an IDENTIFY DEVICE structure, or device is in a low-power mode (see '-n' option above).
                Bit 2: Some SMART or other ATA command to the disk failed, or there was a checksum error in a SMART data structure (see '-b' option above).
                Bit 3: SMART status check returned "DISK FAILING".
                Bit 4: We found prefail Attributes <= threshold.
                Bit 5: SMART status check returned "DISK OK" but we found that some (usage or prefail) Attributes have been <= threshold at some time in the past.
                Bit 6: The device error log contains records of errors.
                Bit 7: The device self-test log contains records of errors. [ATA only] Failed self-tests outdated by a newer successful extended self-test are ignored.
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.exit_status
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
              # One trigger per exit-status bit (masks 1, 2, 4, 8, 16, 32, 64, 128).
              # Each expression is true when the masked bit is set in the latest
              # value and either count(...,#2) = 1, or the masked latest value is
              # greater than the masked previous value (#2).
              # recovery_mode is NONE and manual_close is 'YES' on every one.
              trigger_prototypes:
                - uuid: c51b609f267c45c3bcb4a3f5f40b6d35
                  expression: |
                    ( count(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2) = 1 and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),8) = 8 )
                    or ( bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),8) = 8
                    and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),8) > bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2),8) )
                  recovery_mode: NONE
                  name: 'SMART [{#NAME}]: Check returned "DISK FAILING"'
                  priority: HIGH
                  description: 'SMART status check returned "DISK FAILING".'
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
                - uuid: 12ed61dfd27c4666883c4240a5726d06
                  expression: |
                    ( count(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2) = 1 and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),1) = 1 )
                    or ( bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),1) = 1
                    and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),1) > bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2),1) )
                  recovery_mode: NONE
                  name: 'SMART [{#NAME}]: Command line did not parse'
                  priority: HIGH
                  description: 'Command line did not parse.'
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
                - uuid: 9b960cb324774b3fa5e3d39aeb3141e2
                  expression: |
                    ( count(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2) = 1 and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),2) = 2 )
                    or ( bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),2) = 2
                    and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),2) > bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2),2) )
                  recovery_mode: NONE
                  name: 'SMART [{#NAME}]: Device open failed'
                  priority: HIGH
                  description: 'Device open failed, device did not return an IDENTIFY DEVICE structure, or device is in a low-power mode.'
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
                - uuid: ccff1b75f69a47cdbb5a04c58d201a0f
                  expression: |
                    ( count(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2) = 1 and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),64) = 64 )
                    or ( bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),64) = 64
                    and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),64) > bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2),64) )
                  recovery_mode: NONE
                  name: 'SMART [{#NAME}]: Error log contains records'
                  priority: HIGH
                  description: 'The device error log contains records of errors.'
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
                - uuid: 69fb021abcc841b7b35cc93358ef085c
                  expression: |
                    ( count(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2) = 1 and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),128) = 128 )
                    or ( bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),128) = 128
                    and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),128) > bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2),128) )
                  recovery_mode: NONE
                  name: 'SMART [{#NAME}]: Self-test log contains records'
                  priority: HIGH
                  description: |
                    The device self-test log contains records of errors. [ATA only]
                    Failed self-tests outdated by a newer successful extended self-test are ignored.
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
                - uuid: 4ad2fbb5b6e349f6852a489b99a2760d
                  expression: |
                    ( count(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2) = 1 and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),32) = 32 )
                    or ( bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),32) = 32
                    and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),32) > bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2),32) )
                  recovery_mode: NONE
                  name: 'SMART [{#NAME}]: Some Attributes have been <= threshold'
                  priority: HIGH
                  description: |
                    SMART status check returned "DISK OK" but we found that some (usage
                    or prefail) Attributes have been <= threshold at some time in the past.
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
                - uuid: 592e647842d048e3985e65726cdc838c
                  expression: |
                    ( count(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2) = 1 and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),4) = 4 )
                    or ( bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),4) = 4
                    and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),4) > bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2),4) )
                  recovery_mode: NONE
                  name: 'SMART [{#NAME}]: Some command to the disk failed'
                  priority: HIGH
                  description: |
                    Some SMART or other ATA command to the disk failed,
                    or there was a checksum error in a SMART data structure.
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
                - uuid: ec137781d51249c89d8891a35a596445
                  expression: |
                    ( count(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2) = 1 and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),16) = 16 )
                    or ( bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),16) = 16
                    and bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}]),16) > bitand(last(/SMART by Zabbix agent 2/smart.disk.es[{#NAME}],#2),16) )
                  recovery_mode: NONE
                  name: 'SMART [{#NAME}]: Some prefail Attributes <= threshold'
                  priority: HIGH
                  description: 'We found prefail Attributes <= threshold.'
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
            # Master item referenced by every dependent item prototype in this rule.
            # It stores no history or trends itself (both '0'); the dependents
            # extract individual fields from its value with JSONPath.
            - uuid: 805e1d6f91e741ac93e87bd7d62860d5
              name: 'SMART [{#NAME}]: Get disk attributes'
              key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              history: '0'
              trends: '0'
              value_type: TEXT
              tags:
                - tag: component
                  value: raw
                - tag: component
                  value: storage
            - uuid: 365f9642f2764116923bb3e014eefa22
              name: 'SMART [{#NAME}]: Power on hours'
              type: DEPENDENT
              key: 'smart.disk.hours[{#NAME}]'
              delay: '0'
              history: 7d
              description: |
                Count of hours in power-on state. The raw value of this attribute
                shows total count of hours (or minutes, or seconds, depending on manufacturer)
                in power-on state. "By default, the total expected lifetime of a hard disk
                in perfect condition is defined as 5 years (running every day and night on
                all days). This is equal to 1825 days in 24/7 mode or 43800 hours." On some
                pre-2005 drives, this raw value may advance erratically and/or "wrap around"
                (reset to zero periodically). https://en.wikipedia.org/wiki/S.M.A.R.T.#Known_ATA_S.M.A.R.T._attributes
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.power_on_time
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: 8478d6421fb044339e2118848ac6d56b
              name: 'SMART [{#NAME}]: Media errors'
              type: DEPENDENT
              key: 'smart.disk.media_errors[{#NAME}]'
              delay: '0'
              history: 7d
              description: |
                Contains the number of occurrences where the controller detected
                an unrecovered data integrity error. Errors such as uncorrectable ECC, CRC
                checksum failure, or LBA tag mismatch are included in this field.
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.media_errors
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: b6abf9b52c694600b63fce4a68fc0fbd
              name: 'SMART [{#NAME}]: Device model'
              type: DEPENDENT
              key: 'smart.disk.model[{#NAME}]'
              delay: '0'
              history: 7d
              trends: '0'
              value_type: CHAR
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.model_name
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: inventory
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
            - uuid: 6ce46d274a694eac9700bd02a936f4be
              name: 'SMART [{#NAME}]: Percentage used'
              type: DEPENDENT
              key: 'smart.disk.percentage_used[{#NAME}]'
              delay: '0'
              history: 7d
              units: '%'
              description: |
                Contains a vendor specific estimate of the percentage of NVM subsystem
                life used based on the actual usage and the manufacturer's prediction of NVM
                life. A value of 100 indicates that the estimated endurance of the NVM in
                the NVM subsystem has been consumed, but may not indicate an NVM subsystem
                failure. The value is allowed to exceed 100. Percentages greater than 254
                shall be represented as 255. This value shall be updated once per power-on
                hour (when the controller is not in a sleep state).
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.percentage_used
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: storage
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
              trigger_prototypes:
                # The 90 threshold is a literal in the expression, not a user macro.
                - uuid: e2bc2b0e195446d7973037be8e41eb6f
                  expression: 'last(/SMART by Zabbix agent 2/smart.disk.percentage_used[{#NAME}])>90'
                  name: 'SMART [{#NAME}]: NVMe disk percentage using is over 90% of estimated endurance'
                  priority: AVERAGE
                  tags:
                    - tag: scope
                      value: notice
            - uuid: 62f98419c8034f389a5be3755eac8938
              name: 'SMART [{#NAME}]: Serial number'
              type: DEPENDENT
              key: 'smart.disk.sn[{#NAME}]'
              delay: '0'
              history: 7d
              trends: '0'
              value_type: CHAR
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.serial_number
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: inventory
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
              trigger_prototypes:
                # True when the latest serial number differs from the previous one
                # and the latest value is non-empty.
                - uuid: 7257c02f398f4338ace1eb3a07cb7362
                  expression: 'last(/SMART by Zabbix agent 2/smart.disk.sn[{#NAME}],#1)<>last(/SMART by Zabbix agent 2/smart.disk.sn[{#NAME}],#2) and length(last(/SMART by Zabbix agent 2/smart.disk.sn[{#NAME}]))>0'
                  name: 'SMART [{#NAME}]: Disk has been replaced'
                  event_name: 'SMART [{#NAME}]: Disk has been replaced (new serial number received)'
                  priority: INFO
                  description: 'Device serial number has changed. Acknowledge to close the problem manually.'
                  manual_close: 'YES'
                  tags:
                    - tag: scope
                      value: notice
            - uuid: 2f5b054d7a644e029a195d17f525c191
              name: 'SMART [{#NAME}]: Temperature'
              type: DEPENDENT
              key: 'smart.disk.temperature[{#NAME}]'
              delay: '0'
              history: 7d
              units: °C
              description: 'Current drive temperature.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.temperature
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: temperature
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
              # Two thresholds on the 5-minute average; the WARNING trigger lists
              # the critical trigger under `dependencies`.
              trigger_prototypes:
                - uuid: cd09aebe3ca146119cdf5b977bf6b018
                  expression: 'avg(/SMART by Zabbix agent 2/smart.disk.temperature[{#NAME}],5m)>{$SMART.TEMPERATURE.MAX.CRIT}'
                  name: 'SMART [{#NAME}]: Average disk temperature is critical'
                  event_name: 'SMART [{#NAME}]: Average disk temperature is critical (over {$SMART.TEMPERATURE.MAX.CRIT}°C for 5m)'
                  priority: AVERAGE
                  tags:
                    - tag: scope
                      value: notice
                - uuid: aaa5acb3196b481f894998c0ca5ea165
                  expression: 'avg(/SMART by Zabbix agent 2/smart.disk.temperature[{#NAME}],5m)>{$SMART.TEMPERATURE.MAX.WARN}'
                  name: 'SMART [{#NAME}]: Average disk temperature is too high'
                  event_name: 'SMART [{#NAME}]: Average disk temperature is too high (over {$SMART.TEMPERATURE.MAX.WARN}°C for 5m)'
                  priority: WARNING
                  dependencies:
                    - name: 'SMART [{#NAME}]: Average disk temperature is critical'
                      expression: 'avg(/SMART by Zabbix agent 2/smart.disk.temperature[{#NAME}],5m)>{$SMART.TEMPERATURE.MAX.CRIT}'
                  tags:
                    - tag: scope
                      value: notice
            - uuid: 434b338d88e041dd9b6a0b7aaa403076
              name: 'SMART [{#NAME}]: Self-test passed'
              type: DEPENDENT
              key: 'smart.disk.test[{#NAME}]'
              delay: '0'
              history: 7d
              trends: '0'
              value_type: CHAR
              description: 'The disk is passed the SMART self-test or not.'
              preprocessing:
                - type: JSONPATH
                  parameters:
                    - $.self_test_passed
                - type: DISCARD_UNCHANGED_HEARTBEAT
                  parameters:
                    - 6h
              master_item:
                key: 'smart.disk.get[{#PATH},"{#RAIDTYPE}"]'
              tags:
                - tag: component
                  value: health
                - tag: diskname
                  value: '{#NAME}'
                - tag: disktype
                  value: '{#DISKTYPE}'
              trigger_prototypes:
                - uuid: 5fa97df4012e45279fb55724f617ef4a
                  expression: 'last(/SMART by Zabbix agent 2/smart.disk.test[{#NAME}])="false"'
                  name: 'SMART [{#NAME}]: Disk self-test is not passed'
                  priority: HIGH
                  tags:
                    - tag: scope
                      value: notice
          # Overrides are numbered by `step`. Steps 1-2 set NO_DISCOVER on item
          # prototypes by {#DISKTYPE}; steps 3-11 set DISCOVER on one attribute
          # item prototype each, keyed on {#ATTRIBUTES} containing its name.
          overrides:
            - name: Self-test
              step: '1'
              filter:
                conditions:
                  - macro: '{#DISKTYPE}'
                    value: nvme
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: LIKE
                  value: Self-test
                  discover: NO_DISCOVER
            - name: 'Not NVMe'
              step: '2'
              filter:
                conditions:
                  - macro: '{#DISKTYPE}'
                    value: nvme
                    operator: NOT_MATCHES_REGEX
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Media|Percentage|Critical
                  discover: NO_DISCOVER
            - name: Raw_Read_Error_Rate
              step: '3'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Raw_Read_Error_Rate
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Raw_Read_Error_Rate
                  discover: DISCOVER
            - name: Spin_Up_Time
              step: '4'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Spin_Up_Time
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Spin_Up_Time
                  discover: DISCOVER
            - name: Start_Stop_Count
              step: '5'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Start_Stop_Count
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Start_Stop_Count
                  discover: DISCOVER
            - name: Power_Cycle_Count
              step: '6'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Power_Cycle_Count
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Power_Cycle_Count
                  discover: DISCOVER
            - name: Reported_Uncorrect
              step: '7'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Reported_Uncorrect
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Reported_Uncorrect
                  discover: DISCOVER
            - name: Seek_Error_Rate
              step: '8'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Seek_Error_Rate
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Seek_Error_Rate
                  discover: DISCOVER
            - name: Bad_Block_Rate
              step: '9'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Bad_Block_Rate
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Bad_Block_Rate
                  discover: DISCOVER
            - name: Program_Fail_Count_Chip
              step: '10'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Program_Fail_Count_Chip
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Program_Fail_Count_Chip
                  discover: DISCOVER
            - name: Reallocated_Sector_Ct
              step: '11'
              filter:
                conditions:
                  - macro: '{#ATTRIBUTES}'
                    value: Reallocated_Sector_Ct
                    formulaid: A
              operations:
                - operationobject: ITEM_PROTOTYPE
                  operator: REGEXP
                  value: Reallocated_Sector_Ct
                  discover: DISCOVER
      tags:
        - tag: class
          value: storage
        - tag: target
          value: hdd
        - tag: target
          value: ssd
      # User macros consumed by the discovery filter and the temperature triggers.
      macros:
        - macro: '{$SMART.DISK.NAME.MATCHES}'
          value: '^.*$'
          description: 'This macro is used in the filter of attribute and disk discoveries. It can be overridden on the host or linked on the template level.'
        - macro: '{$SMART.DISK.NAME.NOT_MATCHES}'
          value: CHANGE_IF_NEEDED
          description: 'This macro is used in the filter of attribute and disk discoveries. It can be overridden on the host or linked on the template level.'
        - macro: '{$SMART.TEMPERATURE.MAX.CRIT}'
          value: '65'
          description: 'This macro is used for trigger expression. It can be overridden on the host or linked on the template level.'
        - macro: '{$SMART.TEMPERATURE.MAX.WARN}'
          value: '50'
          description: 'This macro is used for trigger expression. It can be overridden on the host or linked on the template level.'
      # Dashboard with two pages, each holding one graph-prototype widget bound
      # to an item prototype (temperature, power-on hours).
      dashboards:
        - uuid: 074166cdd4d54f7e89bd7488283ba5be
          name: 'SMART: Overview'
          pages:
            - name: Temperature
              widgets:
                - type: graphprototype
                  width: '24'
                  height: '20'
                  fields:
                    - type: INTEGER
                      name: columns
                      value: '2'
                    - type: INTEGER
                      name: rows
                      value: '5'
                    - type: INTEGER
                      name: source_type
                      value: '3'
                    - type: ITEM_PROTOTYPE
                      name: itemid
                      value:
                        host: 'SMART by Zabbix agent 2'
                        key: 'smart.disk.temperature[{#NAME}]'
            - name: 'Power On'
              widgets:
                - type: graphprototype
                  width: '24'
                  height: '20'
                  fields:
                    - type: INTEGER
                      name: columns
                      value: '2'
                    - type: INTEGER
                      name: rows
                      value: '5'
                    - type: INTEGER
                      name: source_type
                      value: '3'
                    - type: ITEM_PROTOTYPE
                      name: itemid
                      value:
                        host: 'SMART by Zabbix agent 2'
                        key: 'smart.disk.hours[{#NAME}]'