Software: Apache/2.4.41 (Ubuntu). PHP/8.0.30 uname -a: Linux apirnd 5.4.0-204-generic #224-Ubuntu SMP Thu Dec 5 13:38:28 UTC 2024 x86_64 uid=33(www-data) gid=33(www-data) groups=33(www-data) Safe-mode: OFF (not secure) /netdata/health/health.d/ drwxr-xr-x | |
| Viewing file: Select action/file-type:
# Common
# Alert on HDFS capacity utilization: used space as a percentage of
# (used + remaining) space, read from the hdfs.capacity chart every 10s.
template: hdfs_capacity_usage
on: hdfs.capacity
class: Utilization
type: Storage
component: HDFS
calc: ($used) * 100 / ($used + $remaining)
units: %
every: 10s
# Hysteresis: WARNING is raised when the value exceeds 80; once the alert is
# already in WARNING or a higher status, the threshold drops to 70.
warn: $this > (($status >= $WARNING) ? (70) : (80))
# Hysteresis: CRITICAL is raised when the value exceeds 98; once the alert is
# already CRITICAL, the threshold drops to 80.
crit: $this > (($status == $CRITICAL) ? (80) : (98))
delay: down 15m multiplier 1.5 max 1h
info: summary datanodes space capacity utilization
to: sysadmin
# NameNode
# Warn whenever the hdfs.blocks chart reports any missing blocks
# ($missing > 0). No critical threshold is defined for this alert.
template: hdfs_missing_blocks
on: hdfs.blocks
class: Errors
type: Storage
component: HDFS
calc: $missing
units: missing blocks
every: 10s
warn: $this > 0
delay: down 15m multiplier 1.5 max 1h
info: number of missing blocks
to: sysadmin
# Warn whenever the hdfs.data_nodes chart reports any stale datanodes
# ($stale > 0). No critical threshold is defined for this alert.
template: hdfs_stale_nodes
on: hdfs.data_nodes
class: Errors
type: Storage
component: HDFS
calc: $stale
# Units describe the $stale dimension; the previous value "dead nodes" was a
# copy-paste from hdfs_dead_nodes and mislabelled the value shown to operators.
units: stale nodes
every: 10s
warn: $this > 0
delay: down 15m multiplier 1.5 max 1h
info: number of datanodes marked stale due to delayed heartbeat
to: sysadmin
# Raise CRITICAL whenever the hdfs.data_nodes chart reports any dead
# datanodes ($dead > 0). This alert has no warning threshold.
template: hdfs_dead_nodes
on: hdfs.data_nodes
class: Errors
type: Storage
component: HDFS
calc: $dead
units: dead nodes
every: 10s
crit: $this > 0
delay: down 15m multiplier 1.5 max 1h
info: number of datanodes which are currently dead
to: sysadmin
# DataNode
# Warn whenever the hdfs.num_failed_volumes chart reports any failed volumes
# ($fsds_num_failed_volumes > 0). No critical threshold is defined.
template: hdfs_num_failed_volumes
on: hdfs.num_failed_volumes
class: Errors
type: Storage
component: HDFS
calc: $fsds_num_failed_volumes
units: failed volumes
every: 10s
warn: $this > 0
delay: down 15m multiplier 1.5 max 1h
info: number of failed volumes
to: sysadmin
|
:: Command execute :: | |
--[ c99shell v. 2.5 [PHP 8 Update] [24.05.2025] | Generation time: 0.0052 ]-- |