|
| 1 | +apiVersion: v1 |
| 2 | +data: |
| 3 | + kernel-monitor.json: | |
| 4 | + { |
| 5 | + "plugin": "journald", |
| 6 | + "pluginConfig": { |
| 7 | + "source": "kernel" |
| 8 | + }, |
| 9 | + "logPath": "/var/log/journal", |
| 10 | + "lookback": "5m", |
| 11 | + "bufferSize": 10, |
| 12 | + "source": "kernel-monitor", |
| 13 | + "conditions": [ |
| 14 | + { |
| 15 | + "type": "KernelDeadlock", |
| 16 | + "reason": "KernelHasNoDeadlock", |
| 17 | + "message": "kernel has no deadlock" |
| 18 | + } |
| 19 | + ], |
| 20 | + "rules": [ |
| 21 | + { |
| 22 | + "type": "temporary", |
| 23 | + "reason": "OOMKilling", |
| 24 | + "pattern": "Kill process \\d+ (.+) score \\d+ or sacrifice child\\nKilled process \\d+ (.+) total-vm:\\d+kB, anon-rss:\\d+kB, file-rss:\\d+kB.*" |
| 25 | + }, |
| 26 | + { |
| 27 | + "type": "temporary", |
| 28 | + "reason": "TaskHung", |
| 29 | + "pattern": "task \\S+:\\w+ blocked for more than \\w+ seconds\\." |
| 30 | + }, |
| 31 | + { |
| 32 | + "type": "temporary", |
| 33 | + "reason": "UnregisterNetDevice", |
| 34 | + "pattern": "unregister_netdevice: waiting for \\w+ to become free\\. Usage count = \\d+" |
| 35 | + }, |
| 36 | + { |
| 37 | + "type": "temporary", |
| 38 | + "reason": "KernelOops", |
| 39 | + "pattern": "BUG: unable to handle kernel NULL pointer dereference at .*" |
| 40 | + }, |
| 41 | + { |
| 42 | + "type": "temporary", |
| 43 | + "reason": "KernelOops", |
| 44 | + "pattern": "divide error: 0000 \\[#\\d+\\] SMP" |
| 45 | + }, |
| 46 | + { |
| 47 | + "type": "permanent", |
| 48 | + "condition": "KernelDeadlock", |
| 49 | + "reason": "AUFSUmountHung", |
| 50 | + "pattern": "task umount\\.aufs:\\w+ blocked for more than \\w+ seconds\\." |
| 51 | + }, |
| 52 | + { |
| 53 | + "type": "permanent", |
| 54 | + "condition": "KernelDeadlock", |
| 55 | + "reason": "DockerHung", |
| 56 | + "pattern": "task docker:\\w+ blocked for more than \\w+ seconds\\." |
| 57 | + } |
| 58 | + ] |
| 59 | + } |
| 60 | + docker-monitor.json: | |
| 61 | + { |
| 62 | + "plugin": "journald", |
| 63 | + "pluginConfig": { |
| 64 | + "source": "docker" |
| 65 | + }, |
| 66 | + "logPath": "/var/log/journal", |
| 67 | + "lookback": "5m", |
| 68 | + "bufferSize": 10, |
| 69 | + "source": "docker-monitor", |
| 70 | + "conditions": [], |
| 71 | + "rules": [ |
| 72 | + { |
| 73 | + "type": "temporary", |
| 74 | + "reason": "CorruptDockerImage", |
| 75 | + "pattern": "Error trying v2 registry: failed to register layer: rename /var/lib/docker/image/(.+) /var/lib/docker/image/(.+): directory not empty.*" |
| 76 | + } |
| 77 | + ] |
| 78 | + } |
| 79 | +kind: ConfigMap |
| 80 | +metadata: |
| 81 | + name: node-problem-detector-config |
| 82 | + namespace: default |
0 commit comments