{
  "id": "kubernetes/kubelet-node-status-notfound",
  "signature": "Error: node 'worker-node-1' not found — kubelet is not posting node status",
  "signature_zh": "错误：节点 'worker-node-1' 未找到 — kubelet 未发布节点状态",
  "regex": "node '.*' not found",
  "domain": "kubernetes",
  "category": "system_error",
  "subcategory": null,
  "root_cause": "Kubelet on the node has stopped reporting its status to the API server, often due to kubelet crash, network disconnection, or certificate expiration, causing the node to be marked as NotReady or removed.",
  "root_cause_type": "generic",
  "root_cause_zh": "节点上的kubelet已停止向API服务器报告其状态，通常由于kubelet崩溃、网络断开或证书过期，导致节点被标记为NotReady或移除。",
  "versions": [
    {
      "version": "Kubernetes 1.24",
      "introduced": null,
      "deprecated": null,
      "removed": null,
      "behavior_change": null,
      "status": "active"
    },
    {
      "version": "Kubernetes 1.25",
      "introduced": null,
      "deprecated": null,
      "removed": null,
      "behavior_change": null,
      "status": "active"
    },
    {
      "version": "Kubernetes 1.26",
      "introduced": null,
      "deprecated": null,
      "removed": null,
      "behavior_change": null,
      "status": "active"
    },
    {
      "version": "kubeadm 1.25.0",
      "introduced": null,
      "deprecated": null,
      "removed": null,
      "behavior_change": null,
      "status": "active"
    }
  ],
  "os_specific": {},
  "dead_ends": [
    {
      "action": "",
      "why_fails": "Restarting the API server does not fix the node issue; the kubelet must be fixed on the node itself.",
      "fail_rate": 0.9,
      "condition": "",
      "sources": []
    },
    {
      "action": "",
      "why_fails": "Deleting and re-creating the node object in Kubernetes without fixing the kubelet will result in the same error because the new node will also fail to report status.",
      "fail_rate": 0.7,
      "condition": "",
      "sources": []
    }
  ],
  "workarounds": [
    {
      "action": "SSH into the node and check kubelet status: `systemctl status kubelet`. If stopped, restart it: `systemctl restart kubelet`. Then check logs: `journalctl -u kubelet -n 50`. Common causes: certificate expired (`openssl x509 -in /var/lib/kubelet/pki/kubelet-client-current.pem -text -noout`). If expired, rotate kubelet certificates: `kubeadm certs renew kubelet` and restart kubelet.",
      "success_rate": 0.85,
      "how": "SSH into the node and check kubelet status: `systemctl status kubelet`. If stopped, restart it: `systemctl restart kubelet`. Then check logs: `journalctl -u kubelet -n 50`. Common causes: certificate expired (`openssl x509 -in /var/lib/kubelet/pki/kubelet-client-current.pem -text -noout`). If expired, rotate kubelet certificates: `kubeadm certs renew kubelet` and restart kubelet.",
      "condition": "",
      "sources": []
    },
    {
      "action": "If the node is unreachable, delete the node object from the cluster: `kubectl delete node worker-node-1`. Then rejoin the node using `kubeadm join` with the correct token. This forces a fresh registration.",
      "success_rate": 0.75,
      "how": "If the node is unreachable, delete the node object from the cluster: `kubectl delete node worker-node-1`. Then rejoin the node using `kubeadm join` with the correct token. This forces a fresh registration.",
      "condition": "",
      "sources": []
    }
  ],
  "workarounds_zh": [
    "SSH进入节点并检查kubelet状态：`systemctl status kubelet`。如果已停止，重启：`systemctl restart kubelet`。然后检查日志：`journalctl -u kubelet -n 50`。常见原因：证书过期（`openssl x509 -in /var/lib/kubelet/pki/kubelet-client-current.pem -text -noout`）。如果过期，轮换kubelet证书：`kubeadm certs renew kubelet`并重启kubelet。",
    "如果节点不可达，从集群中删除节点对象：`kubectl delete node worker-node-1`。然后使用正确的令牌通过`kubeadm join`重新加入节点。这强制进行新注册。"
  ],
  "transition_graph": {
    "leads_to": [],
    "preceded_by": [],
    "frequently_confused_with": []
  },
  "official_doc_url": "https://kubernetes.io/docs/tasks/administer-cluster/kubelet-config-file/",
  "official_doc_section": null,
  "error_code": null,
  "verification_tier": "ai_generated",
  "confidence": 0.88,
  "fix_success_rate": 0.82,
  "resolvable": "true",
  "first_seen": "2023-04-05",
  "last_confirmed": "2024-06-01",
  "last_updated": "2024-06-01",
  "evidence_count": 1,
  "tags": [],
  "locale": "en",
  "aliases": []
}