first commit
This commit is contained in:
302
check-longhorn.sh
Normal file
302
check-longhorn.sh
Normal file
@@ -0,0 +1,302 @@
|
||||
#!/bin/bash
|
||||
|
||||
export RED='\x1b[0;31m'
|
||||
export GREEN='\x1b[38;5;22m'
|
||||
export CYAN='\x1b[36m'
|
||||
export YELLOW='\x1b[33m'
|
||||
export NO_COLOR='\x1b[0m'
|
||||
|
||||
if [ -z "${LOG_TITLE}" ]; then
|
||||
LOG_TITLE=''
|
||||
fi
|
||||
if [ -z "${LOG_LEVEL}" ]; then
|
||||
LOG_LEVEL="INFO"
|
||||
fi
|
||||
|
||||
debug() {
|
||||
if [[ "${LOG_LEVEL}" == "DEBUG" ]]; then
|
||||
local log_title
|
||||
if [ -n "${LOG_TITLE}" ]; then
|
||||
log_title="(${LOG_TITLE})"
|
||||
else
|
||||
log_title=''
|
||||
fi
|
||||
echo -e "${GREEN}[DEBUG]${log_title} ${NO_COLOR}$1"
|
||||
fi
|
||||
}
|
||||
|
||||
info() {
|
||||
if [[ "${LOG_LEVEL}" == "DEBUG" ]] ||\
|
||||
[[ "${LOG_LEVEL}" == "INFO" ]]; then
|
||||
local log_title
|
||||
if [ -n "${LOG_TITLE}" ]; then
|
||||
log_title="(${LOG_TITLE})"
|
||||
else
|
||||
log_title=''
|
||||
fi
|
||||
echo -e "${CYAN}[INFO] ${log_title} ${NO_COLOR}$1"
|
||||
fi
|
||||
}
|
||||
|
||||
warn() {
|
||||
if [[ "${LOG_LEVEL}" == "DEBUG" ]] ||\
|
||||
[[ "${LOG_LEVEL}" == "INFO" ]] ||\
|
||||
[[ "${LOG_LEVEL}" == "WARN" ]]; then
|
||||
local log_title
|
||||
if [ -n "${LOG_TITLE}" ]; then
|
||||
log_title="(${LOG_TITLE})"
|
||||
else
|
||||
log_title=''
|
||||
fi
|
||||
echo -e "${YELLOW}[WARN] ${log_title} ${NO_COLOR}$1"
|
||||
fi
|
||||
}
|
||||
|
||||
error() {
|
||||
if [[ "${LOG_LEVEL}" == "DEBUG" ]] ||\
|
||||
[[ "${LOG_LEVEL}" == "INFO" ]] ||\
|
||||
[[ "${LOG_LEVEL}" == "WARN" ]] ||\
|
||||
[[ "${LOG_LEVEL}" == "ERROR" ]]; then
|
||||
local log_title
|
||||
if [ -n "${LOG_TITLE}" ]; then
|
||||
log_title="(${LOG_TITLE})"
|
||||
else
|
||||
log_title=''
|
||||
fi
|
||||
echo -e "${RED}[ERROR]${log_title} ${NO_COLOR}$1"
|
||||
fi
|
||||
}
|
||||
|
||||
detect_node_os()
|
||||
{
|
||||
local pod="$1"
|
||||
|
||||
OS=`kubectl exec -i $pod -- nsenter --mount=/proc/1/ns/mnt -- bash -c 'grep -E "^ID_LIKE=" /etc/os-release | cut -d= -f2'`
|
||||
if [[ -z "${OS}" ]]; then
|
||||
OS=`kubectl exec -i $pod -- nsenter --mount=/proc/1/ns/mnt -- bash -c 'grep -E "^ID=" /etc/os-release | cut -d= -f2'`
|
||||
fi
|
||||
echo "$OS"
|
||||
}
|
||||
|
||||
set_packages_and_check_cmd()
|
||||
{
|
||||
case $OS in
|
||||
*"debian"* | *"ubuntu"* )
|
||||
CHECK_CMD='dpkg -l | grep -w'
|
||||
PACKAGES=(nfs-common open-iscsi)
|
||||
;;
|
||||
*"centos"* | *"fedora"* | *"rocky"* | *"ol"* )
|
||||
CHECK_CMD='rpm -q'
|
||||
PACKAGES=(nfs-utils iscsi-initiator-utils)
|
||||
;;
|
||||
*"suse"* )
|
||||
CHECK_CMD='rpm -q'
|
||||
PACKAGES=(nfs-client open-iscsi)
|
||||
;;
|
||||
*"arch"* )
|
||||
CHECK_CMD='pacman -Q'
|
||||
PACKAGES=(nfs-utils open-iscsi)
|
||||
;;
|
||||
*"gentoo"* )
|
||||
CHECK_CMD='qlist -I'
|
||||
PACKAGES=(net-fs/nfs-utils sys-block/open-iscsi)
|
||||
;;
|
||||
*)
|
||||
CHECK_CMD=''
|
||||
PACKAGES=()
|
||||
warn "Stop the environment check because '$OS' is not supported in the environment check script."
|
||||
exit 1
|
||||
;;
|
||||
esac
|
||||
}
|
||||
|
||||
check_dependencies() {
|
||||
local targets=($@)
|
||||
|
||||
local allFound=true
|
||||
for ((i=0; i<${#targets[@]}; i++)); do
|
||||
local target=${targets[$i]}
|
||||
if [ "$(which $target)" == "" ]; then
|
||||
allFound=false
|
||||
error "Not found: $target"
|
||||
fi
|
||||
done
|
||||
if [ "$allFound" == "false" ]; then
|
||||
error "Please install missing dependencies."
|
||||
exit 2
|
||||
else
|
||||
info "Required dependencies are installed."
|
||||
fi
|
||||
}
|
||||
|
||||
create_ds() {
|
||||
cat <<EOF > $TEMP_DIR/environment_check.yaml
|
||||
apiVersion: apps/v1
|
||||
kind: DaemonSet
|
||||
metadata:
|
||||
labels:
|
||||
app: longhorn-environment-check
|
||||
name: longhorn-environment-check
|
||||
spec:
|
||||
selector:
|
||||
matchLabels:
|
||||
app: longhorn-environment-check
|
||||
template:
|
||||
metadata:
|
||||
labels:
|
||||
app: longhorn-environment-check
|
||||
spec:
|
||||
hostPID: true
|
||||
containers:
|
||||
- name: longhorn-environment-check
|
||||
image: alpine:3.12
|
||||
args: ["/bin/sh", "-c", "sleep 1000000000"]
|
||||
volumeMounts:
|
||||
- name: mountpoint
|
||||
mountPath: /tmp/longhorn-environment-check
|
||||
mountPropagation: Bidirectional
|
||||
securityContext:
|
||||
privileged: true
|
||||
volumes:
|
||||
- name: mountpoint
|
||||
hostPath:
|
||||
path: /tmp/longhorn-environment-check
|
||||
EOF
|
||||
kubectl create -f $TEMP_DIR/environment_check.yaml > /dev/null
|
||||
}
|
||||
|
||||
cleanup() {
|
||||
info "Cleaning up longhorn-environment-check pods..."
|
||||
kubectl delete -f $TEMP_DIR/environment_check.yaml > /dev/null
|
||||
rm -rf $TEMP_DIR
|
||||
info "Cleanup completed."
|
||||
}
|
||||
|
||||
wait_ds_ready() {
|
||||
while true; do
|
||||
local ds=$(kubectl get ds/longhorn-environment-check -o json)
|
||||
local numberReady=$(echo $ds | jq .status.numberReady)
|
||||
local desiredNumberScheduled=$(echo $ds | jq .status.desiredNumberScheduled)
|
||||
|
||||
if [ "$desiredNumberScheduled" == "$numberReady" ] && [ "$desiredNumberScheduled" != "0" ]; then
|
||||
info "All longhorn-environment-check pods are ready ($numberReady/$desiredNumberScheduled)."
|
||||
return
|
||||
fi
|
||||
|
||||
info "Waiting for longhorn-environment-check pods to become ready ($numberReady/$desiredNumberScheduled)..."
|
||||
sleep 3
|
||||
done
|
||||
}
|
||||
|
||||
check_mount_propagation() {
|
||||
local allSupported=true
|
||||
local pods=$(kubectl -l app=longhorn-environment-check get po -o json)
|
||||
|
||||
local ds=$(kubectl get ds/longhorn-environment-check -o json)
|
||||
local desiredNumberScheduled=$(echo $ds | jq .status.desiredNumberScheduled)
|
||||
|
||||
for ((i=0; i<desiredNumberScheduled; i++)); do
|
||||
local pod=$(echo $pods | jq .items[$i])
|
||||
local nodeName=$(echo $pod | jq -r .spec.nodeName)
|
||||
local mountPropagation=$(echo $pod | jq -r '.spec.containers[0].volumeMounts[] | select(.name=="mountpoint") | .mountPropagation')
|
||||
|
||||
if [ "$mountPropagation" != "Bidirectional" ]; then
|
||||
allSupported=false
|
||||
error "node $nodeName: MountPropagation is disabled"
|
||||
fi
|
||||
done
|
||||
|
||||
if [ "$allSupported" != "true" ]; then
|
||||
error "MountPropagation is disabled on at least one node. As a result, CSI driver and Base image cannot be supported."
|
||||
exit 1
|
||||
else
|
||||
info "MountPropagation is enabled."
|
||||
fi
|
||||
}
|
||||
|
||||
check_package_installed() {
|
||||
local pods=$(kubectl get pods -o name | grep longhorn-environment-check)
|
||||
|
||||
local allFound=true
|
||||
|
||||
for pod in ${pods}; do
|
||||
OS=`detect_node_os $pod`
|
||||
if [ x"$OS" == x"" ]; then
|
||||
error "Unable to detect OS on node $node."
|
||||
exit 2
|
||||
fi
|
||||
|
||||
set_packages_and_check_cmd "$OS"
|
||||
|
||||
for ((i=0; i<${#PACKAGES[@]}; i++)); do
|
||||
local package=${PACKAGES[$i]}
|
||||
|
||||
kubectl exec -i $pod -- nsenter --mount=/proc/1/ns/mnt -- timeout 30 bash -c "$CHECK_CMD $package" > /dev/null 2>&1
|
||||
if [ $? != 0 ]; then
|
||||
allFound=false
|
||||
node=`kubectl get ${pod} --no-headers -o=custom-columns=:.spec.nodeName`
|
||||
error "$package is not found in $node."
|
||||
fi
|
||||
done
|
||||
done
|
||||
|
||||
if [ "$allFound" == "false" ]; then
|
||||
error "Please install missing packages."
|
||||
exit 2
|
||||
else
|
||||
info "Required packages are installed."
|
||||
fi
|
||||
}
|
||||
|
||||
check_multipathd() {
|
||||
local pods=$(kubectl get pods -o name | grep longhorn-environment-check)
|
||||
local allNotFound=true
|
||||
|
||||
for pod in ${pods}; do
|
||||
kubectl exec -t $pod -- nsenter --mount=/proc/1/ns/mnt -- bash -c "systemctl status --no-pager multipathd.service" > /dev/null 2>&1
|
||||
if [ $? = 0 ]; then
|
||||
allNotFound=false
|
||||
node=`kubectl get ${pod} --no-headers -o=custom-columns=:.spec.nodeName`
|
||||
warn "multipathd is running on $node."
|
||||
fi
|
||||
done
|
||||
|
||||
if [ "$allNotFound" == "false" ]; then
|
||||
warn "multipathd would probably result in the Longhorn volume mount failure. Please refer to https://longhorn.io/kb/troubleshooting-volume-with-multipath for more information."
|
||||
fi
|
||||
}
|
||||
|
||||
check_iscsid() {
|
||||
local pods=$(kubectl get pods -o name | grep longhorn-environment-check)
|
||||
local allFound=true
|
||||
|
||||
for pod in ${pods}; do
|
||||
kubectl exec -t $pod -- nsenter --mount=/proc/1/ns/mnt -- bash -c "systemctl status --no-pager iscsid.service" > /dev/null 2>&1
|
||||
|
||||
if [ $? != 0 ]; then
|
||||
allFound=false
|
||||
node=`kubectl get ${pod} --no-headers -o=custom-columns=:.spec.nodeName`
|
||||
error "iscsid is not running on $node."
|
||||
fi
|
||||
done
|
||||
|
||||
if [ "$allFound" == "false" ]; then
|
||||
exit 2
|
||||
fi
|
||||
}
|
||||
|
||||
DEPENDENCIES=(kubectl jq mktemp)
|
||||
check_dependencies ${DEPENDENCIES[@]}
|
||||
|
||||
TEMP_DIR=$(mktemp -d)
|
||||
|
||||
trap cleanup EXIT
|
||||
create_ds
|
||||
wait_ds_ready
|
||||
check_package_installed
|
||||
check_iscsid
|
||||
check_multipathd
|
||||
check_mount_propagation
|
||||
|
||||
exit 0
|
||||
|
||||
Reference in New Issue
Block a user