mirror of
				https://github.com/optim-enterprises-bv/kubernetes.git
				synced 2025-11-03 19:58:17 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			121 lines
		
	
	
		
			4.5 KiB
		
	
	
	
		
			Bash
		
	
	
		
			Executable File
		
	
	
	
	
			
		
		
	
	
			121 lines
		
	
	
		
			4.5 KiB
		
	
	
	
		
			Bash
		
	
	
		
			Executable File
		
	
	
	
	
#!/bin/bash
 | 
						|
 | 
						|
# Copyright 2014 The Kubernetes Authors All rights reserved.
 | 
						|
#
 | 
						|
# Licensed under the Apache License, Version 2.0 (the "License");
 | 
						|
# you may not use this file except in compliance with the License.
 | 
						|
# You may obtain a copy of the License at
 | 
						|
#
 | 
						|
#     http://www.apache.org/licenses/LICENSE-2.0
 | 
						|
#
 | 
						|
# Unless required by applicable law or agreed to in writing, software
 | 
						|
# distributed under the License is distributed on an "AS IS" BASIS,
 | 
						|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | 
						|
# See the License for the specific language governing permissions and
 | 
						|
# limitations under the License.
 | 
						|
 | 
						|
# Validates that the cluster is healthy.
 | 
						|
# Error codes are:
 | 
						|
# 0 - success
 | 
						|
# 1 - fatal (cluster is unlikely to work)
 | 
						|
# 2 - non-fatal (encountered some errors, but cluster should be working correctly)
 | 
						|
 | 
						|
set -o errexit
 | 
						|
set -o nounset
 | 
						|
set -o pipefail
 | 
						|
 | 
						|
KUBE_ROOT=$(dirname "${BASH_SOURCE}")/..
 | 
						|
 | 
						|
if [ -f "${KUBE_ROOT}/cluster/env.sh" ]; then
 | 
						|
    source "${KUBE_ROOT}/cluster/env.sh"
 | 
						|
fi
 | 
						|
 | 
						|
source "${KUBE_ROOT}/cluster/lib/util.sh"
 | 
						|
source "${KUBE_ROOT}/cluster/kube-util.sh"
 | 
						|
 | 
						|
ALLOWED_NOTREADY_NODES="${ALLOWED_NOTREADY_NODES:-0}"
 | 
						|
 | 
						|
EXPECTED_NUM_NODES="${NUM_NODES}"
 | 
						|
if [[ "${REGISTER_MASTER_KUBELET:-}" == "true" ]]; then
 | 
						|
  EXPECTED_NUM_NODES=$((EXPECTED_NUM_NODES+1))
 | 
						|
fi
 | 
						|
# Make several attempts to deal with slow cluster birth.
 | 
						|
return_value=0
 | 
						|
attempt=0
 | 
						|
while true; do
 | 
						|
  # The "kubectl get nodes -o template" exports node information.
 | 
						|
  #
 | 
						|
  # Echo the output and gather 2 counts:
 | 
						|
  #  - Total number of nodes.
 | 
						|
  #  - Number of "ready" nodes.
 | 
						|
  #
 | 
						|
  # Suppress errors from kubectl output because during cluster bootstrapping
 | 
						|
  # for clusters where the master node is registered, the apiserver will become
 | 
						|
  # available and then get restarted as the kubelet configures the docker bridge.
 | 
						|
  node=$("${KUBE_ROOT}/cluster/kubectl.sh" get nodes) || true
 | 
						|
  found=$(($(echo "${node}" | wc -l) - 1)) || true
 | 
						|
  ready=$(($(echo "${node}" | grep -v "NotReady" | wc -l ) - 1)) || true
 | 
						|
 | 
						|
  if (( "${found}" == "${EXPECTED_NUM_NODES}" )) && (( "${ready}" == "${EXPECTED_NUM_NODES}")); then
 | 
						|
    break
 | 
						|
  elif (( "${found}" > "${EXPECTED_NUM_NODES}" )) && (( "${ready}" > "${EXPECTED_NUM_NODES}")); then
 | 
						|
    echo -e "${color_red}Detected ${ready} ready nodes, found ${found} nodes out of expected ${EXPECTED_NUM_NODES}. Found more nodes than expected, your cluster may not behave correctly.${color_norm}"
 | 
						|
    break
 | 
						|
  else
 | 
						|
    # Set the timeout to ~25minutes (100 x 15 second) to avoid timeouts for 1000-node clusters.
 | 
						|
    if (( attempt > 100 )); then
 | 
						|
      echo -e "${color_red}Detected ${ready} ready nodes, found ${found} nodes out of expected ${EXPECTED_NUM_NODES}. Your cluster may not be fully functional.${color_norm}"
 | 
						|
      "${KUBE_ROOT}/cluster/kubectl.sh" get nodes
 | 
						|
      if [ "$((${EXPECTED_NUM_NODES} - ${ready}))" -gt "${ALLOWED_NOTREADY_NODES}" ]; then
 | 
						|
        exit 1
 | 
						|
      else
 | 
						|
        return_value=2
 | 
						|
        break
 | 
						|
      fi
 | 
						|
		else
 | 
						|
      echo -e "${color_yellow}Waiting for ${EXPECTED_NUM_NODES} ready nodes. ${ready} ready nodes, ${found} registered. Retrying.${color_norm}"
 | 
						|
    fi
 | 
						|
    attempt=$((attempt+1))
 | 
						|
    sleep 15
 | 
						|
  fi
 | 
						|
done
 | 
						|
echo "Found ${found} node(s)."
 | 
						|
"${KUBE_ROOT}/cluster/kubectl.sh" get nodes
 | 
						|
 | 
						|
attempt=0
 | 
						|
while true; do
 | 
						|
  # The "kubectl componentstatuses -o template" exports components health information.
 | 
						|
  #
 | 
						|
  # Echo the output and gather 2 counts:
 | 
						|
  #  - Total number of componentstatuses.
 | 
						|
  #  - Number of "healthy" components.
 | 
						|
  cs_status=$("${KUBE_ROOT}/cluster/kubectl.sh" get componentstatuses -o template --template='{{range .items}}{{with index .conditions 0}}{{.type}}:{{.status}},{{end}}{{end}}' --api-version=v1) || true
 | 
						|
  componentstatuses=$(echo "${cs_status}" | tr "," "\n" | grep -c 'Healthy:') || true
 | 
						|
  healthy=$(echo "${cs_status}" | tr "," "\n" | grep -c 'Healthy:True') || true
 | 
						|
 | 
						|
  if ((componentstatuses > healthy)); then
 | 
						|
    if ((attempt < 5)); then
 | 
						|
      echo -e "${color_yellow}Cluster not working yet.${color_norm}"
 | 
						|
      attempt=$((attempt+1))
 | 
						|
      sleep 30
 | 
						|
    else
 | 
						|
      echo -e " ${color_yellow}Validate output:${color_norm}"
 | 
						|
      "${KUBE_ROOT}/cluster/kubectl.sh" get cs
 | 
						|
      echo -e "${color_red}Validation returned one or more failed components. Cluster is probably broken.${color_norm}"
 | 
						|
      exit 1
 | 
						|
    fi
 | 
						|
  else
 | 
						|
    break
 | 
						|
  fi
 | 
						|
done
 | 
						|
 | 
						|
echo "Validate output:"
 | 
						|
"${KUBE_ROOT}/cluster/kubectl.sh" get cs
 | 
						|
if [ "${return_value}" == "0" ]; then 
 | 
						|
  echo -e "${color_green}Cluster validation succeeded${color_norm}"
 | 
						|
else
 | 
						|
  echo -e "${color_yellow}Cluster validation encountered some problems, but cluster should be in working order${color_norm}"
 | 
						|
fi
 | 
						|
 | 
						|
exit "${return_value}"
 |