Kubernetes-Node-Problem-Detector
You can tailor the deployment of OpenStack Kubernetes-Node-Problem-Detector with the parameters listed below. Each entry shows the parameter name, its type, and its default value.
General Parameters
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.conditions
Type: list
Description:
[]
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.plugin
Type: string
Description:
“custom”
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.pluginConfig.concurrency
Type: int
Description:
3
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.pluginConfig.invoke_interval
Type: string
Description:
“30s”
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.pluginConfig.max_output_length
Type: int
Description:
80
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.pluginConfig.timeout
Type: string
Description:
“5s”
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.rules[0].path
Type: string
Description:
“./config/plugin/network_problem.sh”
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.rules[0].reason
Type: string
Description:
“ConntrackFull”
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.rules[0].timeout
Type: string
Description:
“3s”
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.rules[0].type
Type: string
Description:
“temporary”
conf.monitors.custom-plugin-monitor.config.network-problem-monitor.source
Type: string
Description:
“network-custom-plugin-monitor”
conf.monitors.custom-plugin-monitor.enabled[0]
Type: string
Description:
“/config/network-problem-monitor.json”
conf.monitors.custom-plugin-monitor.scripts.enabled[0]
Type: string
Description:
“network_problem.sh”
conf.monitors.custom-plugin-monitor.scripts.source."network_problem.sh"
Type: string
Description:
#!/bin/bash
# This plugin checks for common network issues. Currently, it only checks
# if the conntrack table is 50% full.
set -eu
set -o pipefail
conntrack_threshold=$(($(cat /proc/sys/net/netfilter/nf_conntrack_max)/2 ))
conntrack_count=$(cat /proc/sys/net/netfilter/nf_conntrack_count)
if [ "$conntrack_count" -ge "$conntrack_threshold" ]; then
  echo "Conntrack table approaching full"
  exit 1
fi
exit 0
conf.monitors.system-log-monitor.config.docker-monitor-counter.conditions[0].message
Type: string
Description:
“docker overlay2 is functioning properly”
conf.monitors.system-log-monitor.config.docker-monitor-counter.conditions[0].reason
Type: string
Description:
“NoCorruptDockerOverlay2”
conf.monitors.system-log-monitor.config.docker-monitor-counter.conditions[0].type
Type: string
Description:
“CorruptDockerOverlay2”
conf.monitors.system-log-monitor.config.docker-monitor-counter.plugin
Type: string
Description:
“custom”
conf.monitors.system-log-monitor.config.docker-monitor-counter.pluginConfig.concurrency
Type: int
Description:
1
conf.monitors.system-log-monitor.config.docker-monitor-counter.pluginConfig.invoke_interval
Type: string
Description:
“5m”
conf.monitors.system-log-monitor.config.docker-monitor-counter.pluginConfig.max_output_length
Type: int
Description:
80
conf.monitors.system-log-monitor.config.docker-monitor-counter.pluginConfig.timeout
Type: string
Description:
“1m”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].args[0]
Type: string
Description:
“--journald-source=dockerd”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].args[1]
Type: string
Description:
“--log-path=/var/log/journal”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].args[2]
Type: string
Description:
“--lookback=5m”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].args[3]
Type: string
Description:
“--count=10”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].args[4]
Type: string
Description:
“--pattern=returned error: readlink /var/lib/docker/overlay2.*: invalid argument.*”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].condition
Type: string
Description:
“CorruptDockerOverlay2”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].path
Type: string
Description:
“/home/kubernetes/bin/log-counter”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].reason
Type: string
Description:
“CorruptDockerOverlay2”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].timeout
Type: string
Description:
“1m”
conf.monitors.system-log-monitor.config.docker-monitor-counter.rules[0].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.docker-monitor-counter.source
Type: string
Description:
“docker-monitor”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.bufferSize
Type: int
Description:
10
conf.monitors.system-log-monitor.config.docker-monitor-filelog.conditions
Type: list
Description:
[]
conf.monitors.system-log-monitor.config.docker-monitor-filelog.logPath
Type: string
Description:
“/var/log/docker.log”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.lookback
Type: string
Description:
“5m”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.plugin
Type: string
Description:
“filelog”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.pluginConfig.message
Type: string
Description:
“msg="([^\n]*)"”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.pluginConfig.timestamp
Type: string
Description:
“^time="(\S*)"”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.pluginConfig.timestampFormat
Type: string
Description:
“2006-01-02T15:04:05.999999999-07:00”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.rules[0].pattern
Type: string
Description:
“Error trying v2 registry: failed to register layer: rename /var/lib/docker/image/(.+) /var/lib/docker/image/(.+): directory not empty.*”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.rules[0].reason
Type: string
Description:
“CorruptDockerImage”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.rules[0].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.docker-monitor-filelog.source
Type: string
Description:
“docker-monitor”
conf.monitors.system-log-monitor.config.docker-monitor.bufferSize
Type: int
Description:
10
conf.monitors.system-log-monitor.config.docker-monitor.conditions
Type: list
Description:
[]
conf.monitors.system-log-monitor.config.docker-monitor.logPath
Type: string
Description:
“/var/log/journal”
conf.monitors.system-log-monitor.config.docker-monitor.lookback
Type: string
Description:
“5m”
conf.monitors.system-log-monitor.config.docker-monitor.plugin
Type: string
Description:
“journald”
conf.monitors.system-log-monitor.config.docker-monitor.pluginConfig.source
Type: string
Description:
“dockerd”
conf.monitors.system-log-monitor.config.docker-monitor.rules[0].pattern
Type: string
Description:
“Error trying v2 registry: failed to register layer: rename /var/lib/docker/image/(.+) /var/lib/docker/image/(.+): directory not empty.*”
conf.monitors.system-log-monitor.config.docker-monitor.rules[0].reason
Type: string
Description:
“CorruptDockerImage”
conf.monitors.system-log-monitor.config.docker-monitor.rules[0].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.docker-monitor.source
Type: string
Description:
“docker-monitor”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.conditions[0].message
Type: string
Description:
“node is functioning properly”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.conditions[0].reason
Type: string
Description:
“NoFrequentUnregisterNetDevice”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.conditions[0].type
Type: string
Description:
“FrequentUnregisterNetDevice”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.plugin
Type: string
Description:
“custom”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.pluginConfig.concurrency
Type: int
Description:
1
conf.monitors.system-log-monitor.config.kernel-monitor-counter.pluginConfig.invoke_interval
Type: string
Description:
“5m”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.pluginConfig.max_output_length
Type: int
Description:
80
conf.monitors.system-log-monitor.config.kernel-monitor-counter.pluginConfig.timeout
Type: string
Description:
“1m”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].args[0]
Type: string
Description:
“--journald-source=kernel”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].args[1]
Type: string
Description:
“--log-path=/var/log/journal”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].args[2]
Type: string
Description:
“--lookback=20m”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].args[3]
Type: string
Description:
“--count=3”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].args[4]
Type: string
Description:
“--pattern=unregister_netdevice: waiting for \w+ to become free. Usage count = \d+”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].condition
Type: string
Description:
“FrequentUnregisterNetDevice”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].path
Type: string
Description:
“/home/kubernetes/bin/log-counter”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].reason
Type: string
Description:
“UnregisterNetDevice”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].timeout
Type: string
Description:
“1m”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.rules[0].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.kernel-monitor-counter.source
Type: string
Description:
“kernel-monitor”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.bufferSize
Type: int
Description:
10
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.conditions[0].message
Type: string
Description:
“kernel has no deadlock”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.conditions[0].reason
Type: string
Description:
“KernelHasNoDeadlock”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.conditions[0].type
Type: string
Description:
“KernelDeadlock”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.logPath
Type: string
Description:
“/var/log/kern.log”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.lookback
Type: string
Description:
“5m”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.plugin
Type: string
Description:
“filelog”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.pluginConfig.message
Type: string
Description:
“kernel: \[.*\] (.*)”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.pluginConfig.timestamp
Type: string
Description:
“^.{15}”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.pluginConfig.timestampFormat
Type: string
Description:
“Jan _2 15:04:05”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[0].pattern
Type: string
Description:
“Kill process \d+ (.+) score \d+ or sacrifice child\nKilled process \d+ (.+) total-vm:\d+kB, anon-rss:\d+kB, file-rss:\d+kB.*”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[0].reason
Type: string
Description:
“OOMKilling”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[0].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[1].pattern
Type: string
Description:
“task \S+:\w+ blocked for more than \w+ seconds\.”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[1].reason
Type: string
Description:
“TaskHung”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[1].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[2].pattern
Type: string
Description:
“unregister_netdevice: waiting for \w+ to become free. Usage count = \d+”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[2].reason
Type: string
Description:
“UnregisterNetDevice”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[2].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[3].pattern
Type: string
Description:
“BUG: unable to handle kernel NULL pointer dereference at .*”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[3].reason
Type: string
Description:
“KernelOops”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[3].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[4].pattern
Type: string
Description:
“divide error: 0000 \[#\d+\] SMP”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[4].reason
Type: string
Description:
“KernelOops”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[4].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[5].condition
Type: string
Description:
“KernelDeadlock”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[5].pattern
Type: string
Description:
“task umount\.aufs:\w+ blocked for more than \w+ seconds\.”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[5].reason
Type: string
Description:
“AUFSUmountHung”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[5].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[6].condition
Type: string
Description:
“KernelDeadlock”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[6].pattern
Type: string
Description:
“task docker:\w+ blocked for more than \w+ seconds\.”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[6].reason
Type: string
Description:
“DockerHung”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.rules[6].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.kernel-monitor-filelog.source
Type: string
Description:
“kernel-monitor”
conf.monitors.system-log-monitor.config.kernel-monitor.bufferSize
Type: int
Description:
10
conf.monitors.system-log-monitor.config.kernel-monitor.conditions[0].message
Type: string
Description:
“kernel has no deadlock”
conf.monitors.system-log-monitor.config.kernel-monitor.conditions[0].reason
Type: string
Description:
“KernelHasNoDeadlock”
conf.monitors.system-log-monitor.config.kernel-monitor.conditions[0].type
Type: string
Description:
“KernelDeadlock”
conf.monitors.system-log-monitor.config.kernel-monitor.conditions[1].message
Type: string
Description:
“Filesystem is not read-only”
conf.monitors.system-log-monitor.config.kernel-monitor.conditions[1].reason
Type: string
Description:
“FilesystemIsNotReadOnly”
conf.monitors.system-log-monitor.config.kernel-monitor.conditions[1].type
Type: string
Description:
“ReadonlyFilesystem”
conf.monitors.system-log-monitor.config.kernel-monitor.logPath
Type: string
Description:
“/dev/kmsg”
conf.monitors.system-log-monitor.config.kernel-monitor.lookback
Type: string
Description:
“5m”
conf.monitors.system-log-monitor.config.kernel-monitor.plugin
Type: string
Description:
“kmsg”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[0].pattern
Type: string
Description:
“Kill process \d+ (.+) score \d+ or sacrifice child\nKilled process \d+ (.+) total-vm:\d+kB, anon-rss:\d+kB, file-rss:\d+kB.*”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[0].reason
Type: string
Description:
“OOMKilling”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[0].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[1].pattern
Type: string
Description:
“task \S+:\w+ blocked for more than \w+ seconds\.”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[1].reason
Type: string
Description:
“TaskHung”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[1].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[2].pattern
Type: string
Description:
“unregister_netdevice: waiting for \w+ to become free. Usage count = \d+”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[2].reason
Type: string
Description:
“UnregisterNetDevice”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[2].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[3].pattern
Type: string
Description:
“BUG: unable to handle kernel NULL pointer dereference at .*”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[3].reason
Type: string
Description:
“KernelOops”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[3].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[4].pattern
Type: string
Description:
“divide error: 0000 \[#\d+\] SMP”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[4].reason
Type: string
Description:
“KernelOops”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[4].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[5].condition
Type: string
Description:
“KernelDeadlock”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[5].pattern
Type: string
Description:
“task umount\.aufs:\w+ blocked for more than \w+ seconds\.”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[5].reason
Type: string
Description:
“AUFSUmountHung”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[5].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[6].condition
Type: string
Description:
“KernelDeadlock”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[6].pattern
Type: string
Description:
“task docker:\w+ blocked for more than \w+ seconds\.”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[6].reason
Type: string
Description:
“DockerHung”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[6].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[7].condition
Type: string
Description:
“ReadonlyFilesystem”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[7].pattern
Type: string
Description:
“Remounting filesystem read-only”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[7].reason
Type: string
Description:
“FilesystemIsReadOnly”
conf.monitors.system-log-monitor.config.kernel-monitor.rules[7].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.kernel-monitor.source
Type: string
Description:
“kernel-monitor”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[0].message
Type: string
Description:
“kubelet is functioning properly”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[0].reason
Type: string
Description:
“NoFrequentKubeletRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[0].type
Type: string
Description:
“FrequentKubeletRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[1].message
Type: string
Description:
“docker is functioning properly”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[1].reason
Type: string
Description:
“NoFrequentDockerRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[1].type
Type: string
Description:
“FrequentDockerRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[2].message
Type: string
Description:
“containerd is functioning properly”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[2].reason
Type: string
Description:
“NoFrequentContainerdRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.conditions[2].type
Type: string
Description:
“FrequentContainerdRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.plugin
Type: string
Description:
“custom”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.pluginConfig.concurrency
Type: int
Description:
1
conf.monitors.system-log-monitor.config.systemd-monitor-counter.pluginConfig.invoke_interval
Type: string
Description:
“5m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.pluginConfig.max_output_length
Type: int
Description:
80
conf.monitors.system-log-monitor.config.systemd-monitor-counter.pluginConfig.timeout
Type: string
Description:
“1m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].args[0]
Type: string
Description:
“--journald-source=systemd”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].args[1]
Type: string
Description:
“--log-path=/var/log/journal”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].args[2]
Type: string
Description:
“--lookback=20m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].args[3]
Type: string
Description:
“--delay=5m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].args[4]
Type: string
Description:
“--count=5”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].args[5]
Type: string
Description:
“--pattern=Started Kubernetes kubelet.”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].condition
Type: string
Description:
“FrequentKubeletRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].path
Type: string
Description:
“/home/kubernetes/bin/log-counter”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].reason
Type: string
Description:
“FrequentKubeletRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].timeout
Type: string
Description:
“1m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[0].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].args[0]
Type: string
Description:
“--journald-source=systemd”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].args[1]
Type: string
Description:
“--log-path=/var/log/journal”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].args[2]
Type: string
Description:
“--lookback=20m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].args[3]
Type: string
Description:
“--count=5”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].args[4]
Type: string
Description:
“--pattern=Starting Docker Application Container Engine...”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].condition
Type: string
Description:
“FrequentDockerRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].path
Type: string
Description:
“/home/kubernetes/bin/log-counter”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].reason
Type: string
Description:
“FrequentDockerRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].timeout
Type: string
Description:
“1m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[1].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].args[0]
Type: string
Description:
“--journald-source=systemd”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].args[1]
Type: string
Description:
“--log-path=/var/log/journal”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].args[2]
Type: string
Description:
“--lookback=20m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].args[3]
Type: string
Description:
“--count=5”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].args[4]
Type: string
Description:
“--pattern=Starting containerd container runtime...”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].condition
Type: string
Description:
“FrequentContainerdRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].path
Type: string
Description:
“/home/kubernetes/bin/log-counter”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].reason
Type: string
Description:
“FrequentContainerdRestart”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].timeout
Type: string
Description:
“1m”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.rules[2].type
Type: string
Description:
“permanent”
conf.monitors.system-log-monitor.config.systemd-monitor-counter.source
Type: string
Description:
“systemd-monitor”
conf.monitors.system-log-monitor.config.systemd-monitor.bufferSize
Type: int
Description:
10
conf.monitors.system-log-monitor.config.systemd-monitor.conditions
Type: list
Description:
[]
conf.monitors.system-log-monitor.config.systemd-monitor.logPath
Type: string
Description:
“/var/log/journal”
conf.monitors.system-log-monitor.config.systemd-monitor.lookback
Type: string
Description:
“5m”
conf.monitors.system-log-monitor.config.systemd-monitor.plugin
Type: string
Description:
“journald”
conf.monitors.system-log-monitor.config.systemd-monitor.pluginConfig.source
Type: string
Description:
“systemd”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[0].pattern
Type: string
Description:
“Started Kubernetes kubelet.”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[0].reason
Type: string
Description:
“KubeletStart”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[0].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[1].pattern
Type: string
Description:
“Starting Docker Application Container Engine...”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[1].reason
Type: string
Description:
“DockerStart”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[1].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[2].pattern
Type: string
Description:
“Starting containerd container runtime...”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[2].reason
Type: string
Description:
“ContainerdStart”
conf.monitors.system-log-monitor.config.systemd-monitor.rules[2].type
Type: string
Description:
“temporary”
conf.monitors.system-log-monitor.config.systemd-monitor.source
Type: string
Description:
“systemd-monitor”
conf.monitors.system-log-monitor.enabled[0]
Type: string
Description:
“/config/kernel-monitor.json”
conf.monitors.system-log-monitor.enabled[1]
Type: string
Description:
“/config/docker-monitor.json”
conf.monitors.system-log-monitor.enabled[2]
Type: string
Description:
“/config/systemd-monitor.json”
conf.monitors.system-log-monitor.scripts.enabled
Type: string
Description:
nil
conf.monitors.system-log-monitor.scripts.source
Type: string
Description:
nil
conf.monitors.system-stats-monitor.config.system-stats-monitor.disk.includeAllAttachedBlk
Type: bool
Description:
true
conf.monitors.system-stats-monitor.config.system-stats-monitor.disk.includeRootBlk
Type: bool
Description:
true
conf.monitors.system-stats-monitor.config.system-stats-monitor.disk.lsblkTimeout
Type: string
Description:
“5s”
conf.monitors.system-stats-monitor.config.system-stats-monitor.disk.metricsConfigs.disk/avg_queue_len.displayName
Type: string
Description:
“disk/avg_queue_len”
conf.monitors.system-stats-monitor.config.system-stats-monitor.disk.metricsConfigs.disk/io_time.displayName
Type: string
Description:
“disk/io_time”
conf.monitors.system-stats-monitor.config.system-stats-monitor.disk.metricsConfigs.disk/weighted_io.displayName
Type: string
Description:
“disk/weighted_io”
conf.monitors.system-stats-monitor.config.system-stats-monitor.invokeInterval
Type: string
Description:
“60s”
conf.monitors.system-stats-monitor.enabled[0]
Type: string
Description:
“/config/system-stats-monitor.json”
conf.monitors.system-stats-monitor.scripts.enabled
Type: string
Description:
nil
conf.monitors.system-stats-monitor.scripts.source
Type: string
Description:
nil
dependencies.dynamic.common.local_image_registry.jobs[0]
Type: string
Description:
“node-exporter-image-repo-sync”
dependencies.dynamic.common.local_image_registry.services[0].endpoint
Type: string
Description:
“node”
dependencies.dynamic.common.local_image_registry.services[0].service
Type: string
Description:
“local_image_registry”
dependencies.static.image_repo_sync.services[0].endpoint
Type: string
Description:
“internal”
dependencies.static.image_repo_sync.services[0].service
Type: string
Description:
“local_image_registry”
dependencies.static.node_problem_detector.services
Type: string
Description:
nil
endpoints.cluster_domain_suffix
Type: string
Description:
“cluster.local”
endpoints.local_image_registry.host_fqdn_override.default
Type: string
Description:
nil
endpoints.local_image_registry.hosts.default
Type: string
Description:
“localhost”
endpoints.local_image_registry.hosts.internal
Type: string
Description:
“docker-registry”
endpoints.local_image_registry.hosts.node
Type: string
Description:
“localhost”
endpoints.local_image_registry.name
Type: string
Description:
“docker-registry”
endpoints.local_image_registry.namespace
Type: string
Description:
“docker-registry”
endpoints.local_image_registry.port.registry.node
Type: int
Description:
5000
endpoints.node_problem_detector.host_fqdn_override.default
Type: string
Description:
nil
endpoints.node_problem_detector.hosts.default
Type: string
Description:
“node-problem-detector”
endpoints.node_problem_detector.name
Type: string
Description:
“node-problem-detector”
endpoints.node_problem_detector.namespace
Type: string
Description:
nil
endpoints.node_problem_detector.path.default
Type: string
Description:
nil
endpoints.node_problem_detector.port.metrics.default
Type: int
Description:
20257
endpoints.oci_image_registry.auth.enabled
Type: bool
Description:
false
endpoints.oci_image_registry.auth.kubernetes-node-problem-detector.password
Type: string
Description:
“password”
endpoints.oci_image_registry.auth.kubernetes-node-problem-detector.username
Type: string
Description:
“kubernetes-node-problem-detector”
endpoints.oci_image_registry.host_fqdn_override.default
Type: string
Description:
nil
endpoints.oci_image_registry.hosts.default
Type: string
Description:
“localhost”
endpoints.oci_image_registry.name
Type: string
Description:
“oci-image-registry”
endpoints.oci_image_registry.namespace
Type: string
Description:
“oci-image-registry”
endpoints.oci_image_registry.port.registry.default
Type: string
Description:
nil
images.local_registry.active
Type: bool
Description:
false
images.local_registry.exclude[0]
Type: string
Description:
“dep_check”
images.local_registry.exclude[1]
Type: string
Description:
“image_repo_sync”
images.pull_policy
Type: string
Description:
“IfNotPresent”
images.tags.dep_check
Type: string
Description:
“quay.io/airshipit/kubernetes-entrypoint:latest-ubuntu_focal”
images.tags.image_repo_sync
Type: string
Description:
“docker.io/library/docker:17.07.0”
images.tags.node_problem_detector
Type: string
Description:
“docker.io/openstackhelm/node-problem-detector:latest-ubuntu_jammy”
labels.job.node_selector_key
Type: string
Description:
“openstack-control-plane”
labels.job.node_selector_value
Type: string
Description:
“enabled”
labels.node_problem_detector.node_selector_key
Type: string
Description:
“openstack-control-plane”
labels.node_problem_detector.node_selector_value
Type: string
Description:
“enabled”
manifests.configmap_bin
Type: bool
Description:
true
manifests.configmap_etc
Type: bool
Description:
true
manifests.daemonset
Type: bool
Description:
true
manifests.job_image_repo_sync
Type: bool
Description:
true
manifests.secret_registry
Type: bool
Description:
true
manifests.service
Type: bool
Description:
false
monitoring.prometheus.node_problem_detector.port
Type: int
Description:
20257
monitoring.prometheus.node_problem_detector.scrape
Type: bool
Description:
true
monitoring.prometheus.pod.enabled
Type: bool
Description:
true
monitoring.prometheus.service.enabled
Type: bool
Description:
false
pod.affinity.anti.topologyKey.default
Type: string
Description:
“kubernetes.io/hostname”
pod.affinity.anti.type.default
Type: string
Description:
“preferredDuringSchedulingIgnoredDuringExecution”
pod.lifecycle.termination_grace_period.node_problem_detector.timeout
Type: int
Description:
30
pod.lifecycle.upgrades.daemonsets.node_problem_detector.enabled
Type: bool
Description:
true
pod.lifecycle.upgrades.daemonsets.node_problem_detector.min_ready_seconds
Type: int
Description:
0
pod.lifecycle.upgrades.daemonsets.pod_replacement_strategy
Type: string
Description:
“RollingUpdate”
pod.lifecycle.upgrades.pod_replacement_strategy
Type: string
Description:
“RollingUpdate”
pod.lifecycle.upgrades.revision_history
Type: int
Description:
3
pod.lifecycle.upgrades.rolling_update.max_surge
Type: int
Description:
3
pod.lifecycle.upgrades.rolling_update.max_unavailable
Type: int
Description:
1
pod.mounts.node_problem_detector.init_container
Type: string
Description:
nil
pod.mounts.node_problem_detector.node_problem_detector
Type: string
Description:
nil
pod.resources.enabled
Type: bool
Description:
false
pod.resources.jobs.image_repo_sync.limits.cpu
Type: string
Description:
“2000m”
pod.resources.jobs.image_repo_sync.limits.memory
Type: string
Description:
“1024Mi”
pod.resources.jobs.image_repo_sync.requests.cpu
Type: string
Description:
“100m”
pod.resources.jobs.image_repo_sync.requests.memory
Type: string
Description:
“128Mi”
pod.resources.node_problem_detector.limits.cpu
Type: string
Description:
“2000m”
pod.resources.node_problem_detector.limits.memory
Type: string
Description:
“1024Mi”
pod.resources.node_problem_detector.requests.cpu
Type: string
Description:
“100m”
pod.resources.node_problem_detector.requests.memory
Type: string
Description:
“128Mi”
pod.security_context.node_problem_detector.container.node_problem_detector.privileged
Type: bool
Description:
true
pod.security_context.node_problem_detector.container.node_problem_detector.readOnlyRootFilesystem
Type: bool
Description:
true
pod.security_context.node_problem_detector.pod.runAsUser
Type: int
Description:
0
pod.tolerations.node_problem_detector.enabled
Type: bool
Description:
false
pod.tolerations.node_problem_detector.tolerations[0].key
Type: string
Description:
“node-role.kubernetes.io/master”
pod.tolerations.node_problem_detector.tolerations[0].operator
Type: string
Description:
“Exists”
pod.tolerations.node_problem_detector.tolerations[1].key
Type: string
Description:
“node-role.kubernetes.io/control-plane”
pod.tolerations.node_problem_detector.tolerations[1].operator
Type: string
Description:
“Exists”
pod.tolerations.node_problem_detector.tolerations[2].key
Type: string
Description:
“node-role.kubernetes.io/node”
pod.tolerations.node_problem_detector.tolerations[2].operator
Type: string
Description:
“Exists”
secrets.oci_image_registry.kubernetes-node-problem-detector
Type: string
Description:
“kubernetes-node-problem-detector-oci-image-registry-key”