Separate cluster addons installation (openebs, metallb, cert-mgr) from install_kubead...
[osm/devops.git] / installers / install_kubeadm_cluster.sh
1 #!/bin/bash
2 #
3 # Licensed under the Apache License, Version 2.0 (the "License");
4 # you may not use this file except in compliance with the License.
5 # You may obtain a copy of the License at
6 #
7 # http://www.apache.org/licenses/LICENSE-2.0
8 #
9 # Unless required by applicable law or agreed to in writing, software
10 # distributed under the License is distributed on an "AS IS" BASIS,
11 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 # See the License for the specific language governing permissions and
13 # limitations under the License.
14 #
15
# Make sure errexit (-e), nounset (-u) and xtrace (-x) are all switched off.
set +e +u +x

# Kubernetes minor release (selects the apt repository) and the exact Debian
# package version installed for kubelet, kubeadm and kubectl.
K8S_VERSION="1.29"
K8S_PACKAGE_VERSION="${K8S_VERSION}.3-1.1"
20
# Installs the Kubernetes packages (kubelet, kubeadm, kubectl) from the
# pkgs.k8s.io apt repository and puts them on hold.
# Globals:
#   K8S_VERSION          (read) minor release used to select the apt repository
#   K8S_PACKAGE_VERSION  (read) exact package version to install
#   DEBUG_INSTALL        (read) when non-empty, DEBUG traces are emitted
function install_kube() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    local keyring_dir="/etc/apt/keyrings"
    local keyring="${keyring_dir}/kubernetes-apt-keyring.gpg"
    local repo_url="https://pkgs.k8s.io/core:/stable:/v${K8S_VERSION}/deb/"
    # Kubernetes releases can be found here: https://kubernetes.io/releases/
    # To check the versions available once the repository below is configured, run:
    # apt-cache madison kubeadm
    sudo apt-get -y update && sudo apt-get install -y apt-transport-https ca-certificates curl
    # The keyring folder does not exist by default on every Debian/Ubuntu release
    sudo mkdir -p -m 755 "${keyring_dir}"
    # --yes lets gpg overwrite a keyring left behind by a previous run
    curl -fsSL "${repo_url}Release.key" | sudo gpg --yes --dearmor -o "${keyring}"
    echo "deb [signed-by=${keyring}] ${repo_url} /" | sudo tee /etc/apt/sources.list.d/kubernetes.list
    sudo apt-get -y update
    echo "Installing Kubernetes Packages ..."
    sudo apt-get install -y "kubelet=${K8S_PACKAGE_VERSION}" "kubeadm=${K8S_PACKAGE_VERSION}" "kubectl=${K8S_PACKAGE_VERSION}"
    # Held so that a routine apt upgrade does not move the cluster to another version
    sudo apt-mark hold kubelet kubeadm kubectl
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
36
# Prints the version dpkg reports for package $1 (nothing if there is none).
function _installed_pkg_version() {
    # Match the "Version:" field only; a plain grep for "Version" would also
    # pick up description lines that happen to contain the word.
    dpkg -s "$1" | awk '$1 == "Version:" {print $2; exit}'
}

# Checks that kubelet, kubeadm and kubectl are installed and tracks their versions.
# Globals:
#   kubelet_version, kubeadm_version, kubectl_version (written)
#   DEBUG_INSTALL (read)
# Calls FATAL_TRACK when one of the packages reports no version.
function check_and_track_kube_install() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    kubelet_version=$(_installed_pkg_version kubelet)
    [ -n "${kubelet_version}" ] || FATAL_TRACK k8scluster "Kubelet was not installed."
    kubeadm_version=$(_installed_pkg_version kubeadm)
    [ -n "${kubeadm_version}" ] || FATAL_TRACK k8scluster "Kubeadm was not installed."
    kubectl_version=$(_installed_pkg_version kubectl)
    [ -n "${kubectl_version}" ] || FATAL_TRACK k8scluster "Kubectl was not installed."
    # Versions are quoted so that the positional layout expected by track never shifts
    track k8scluster install_k8s_ok none none none kubelet "${kubelet_version}" none none kubeadm "${kubeadm_version}" none none kubectl "${kubectl_version}" none none
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
49
# Initializes the Kubernetes control plane with kubeadm.
# Arguments:
#   $1 - path to the kubeadm configuration file
# Calls FATAL_TRACK when either the dry-run or the real initialization fails.
function init_kubeadm() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    local kubeadm_config="$1"
    # Swap is switched off now, and the swap entries of /etc/fstab are commented
    # out (a .bak copy is kept) so that it stays off after a reboot
    sudo swapoff -a
    sudo sed -i.bak '/.*none.*swap/s/^\(.*\)$/#\1/g' /etc/fstab
    sudo kubeadm init --config "${kubeadm_config}" --dry-run || FATAL_TRACK k8scluster "kubeadm init dry-run failed"
    # The real run is checked as well: continuing without a control plane is pointless
    sudo kubeadm init --config "${kubeadm_config}" || FATAL_TRACK k8scluster "kubeadm init failed"
    sleep 5
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
60
# Installs the cluster admin kubeconfig as $HOME/.kube/config for the current user.
# Globals:
#   K8S_MANIFEST_DIR (written) folder whose presence is used as evidence that
#                    kubeadm has set up the node
#   HOME, DEBUG_INSTALL (read)
# Calls FATAL_TRACK when the manifests folder does not exist.
function kube_config_dir() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    K8S_MANIFEST_DIR="/etc/kubernetes/manifests"
    [ -d "${K8S_MANIFEST_DIR}" ] || FATAL_TRACK k8scluster "Kubernetes folder $K8S_MANIFEST_DIR was not found"
    mkdir -p "${HOME}/.kube"
    sudo cp /etc/kubernetes/admin.conf "${HOME}/.kube/config"
    # The copy is made through sudo, so hand the file back to the invoking user
    sudo chown "$(id -u):$(id -g)" "${HOME}/.kube/config"
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
71
# Smoke-tests the freshly initialized cluster by listing its namespaces and,
# on success, tracks the init_k8s_ok event.
function check_and_track_init_k8s() {
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG beginning of function
    fi
    echo "Reading existing namespaces"
    if ! kubectl get ns; then
        FATAL_TRACK k8scluster "Failed getting namespaces"
    fi
    track k8scluster init_k8s_ok
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG end of function
    fi
}
80
# Deploys flannel (CNI provider) by downloading its manifest into a temporary
# folder and applying it with kubectl.
# Globals:
#   CNI_DIR                (written) temporary download folder, removed on exit
#   KUBE_FLANNEL_FILE_URL  (written) manifest location
#   DEBUG_INSTALL          (read)
# Calls FATAL_TRACK when the folder cannot be created, the manifest is not
# downloaded or kubectl apply fails.
function deploy_cni_provider() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    CNI_DIR="$(mktemp -d -q --tmpdir "flannel.XXXXXX")" || FATAL_TRACK k8scluster "Cannot Install Flannel because a temporary folder could not be created"
    # NOTE: this replaces any EXIT trap installed earlier in the script
    trap 'rm -rf "${CNI_DIR}"' EXIT
    KUBE_FLANNEL_FILE_URL="https://raw.githubusercontent.com/coreos/flannel/master/Documentation/kube-flannel.yml"
    wget --retry-on-host-error --retry-on-http-error 404,429,503 --tries=5 "${KUBE_FLANNEL_FILE_URL}" -P "${CNI_DIR}"
    [ -f "${CNI_DIR}/kube-flannel.yml" ] || FATAL_TRACK k8scluster "Cannot Install Flannel because $CNI_DIR/kube-flannel.yml was not found. Maybe the file ${KUBE_FLANNEL_FILE_URL} is temporarily not accessible"
    kubectl apply -f "${CNI_DIR}" || FATAL_TRACK k8scluster "Cannot Install Flannel"
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
93
# Removes the control-plane NoSchedule taint (note the trailing "-") from the
# first node whose ROLES column contains "control-plane".
# Globals:
#   K8S_MASTER     (written) name of the selected node
#   DEBUG_INSTALL  (read)
# Calls FATAL_TRACK when no control-plane node is listed.
function taint_master_node() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    K8S_MASTER=$(kubectl get nodes | awk '$3 ~ /control-plane/ {print $1; exit}')
    # Without a node name kubectl would take the taint spec as the node name
    [ -n "${K8S_MASTER}" ] || FATAL_TRACK k8scluster "Cannot find the control-plane node to remove its NoSchedule taint"
    kubectl taint node "${K8S_MASTER}" node-role.kubernetes.io/control-plane:NoSchedule-
    sleep 5
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
102
# Checks that the cluster answers an events query and, on success, tracks the
# k8s_ready_before_helm event.
function check_and_track_k8s_ready_before_helm() {
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG beginning of function
    fi
    if ! kubectl get events; then
        FATAL_TRACK k8scluster "Failed getting events"
    fi
    track k8scluster k8s_ready_before_helm
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG end of function
    fi
}
110
# Installs OpenEBS with Helm, waits for the openebs-hostpath storage class to
# show up (polling every 15 seconds, up to 400 seconds) and marks it as the
# default storage class.
function install_k8s_storageclass() {
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG beginning of function
    fi
    # Openebs versions can be found here: https://github.com/openebs/openebs/releases
    OPENEBS_VERSION="3.7.0"
    echo "Installing OpenEBS"
    helm repo add openebs https://openebs.github.io/charts
    helm repo update
    helm install --create-namespace --namespace openebs openebs openebs/openebs --version "${OPENEBS_VERSION}"
    helm ls -n openebs

    local storageclass_timeout=400
    local waited
    local found=""
    echo "Waiting for storageclass"
    for (( waited = 0; waited < storageclass_timeout; waited += 15 )); do
        if kubectl get storageclass openebs-hostpath &> /dev/null; then
            echo "Storageclass available"
            found="y"
            break
        fi
        sleep 15
    done
    if [ -z "$found" ]; then
        FATAL_TRACK k8scluster "Storageclass not ready after $storageclass_timeout seconds. Cannot install openebs"
    fi
    kubectl patch storageclass openebs-hostpath -p '{"metadata": {"annotations":{"storageclass.kubernetes.io/is-default-class":"true"}}}'
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG end of function
    fi
}
141
# Installs MetalLB from its Helm chart into the metallb-system namespace.
# Globals:
#   METALLB_VERSION (written) chart version to install
function install_helm_metallb() {
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG beginning of function
    fi
    echo "Installing MetalLB"
    METALLB_VERSION="0.13.10"
    helm repo add metallb https://metallb.github.io/metallb
    helm repo update
    local -a install_args=(
        --create-namespace
        --namespace metallb-system
        metallb metallb/metallb
        --version "${METALLB_VERSION}"
    )
    helm install "${install_args[@]}"
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG end of function
    fi
}
152
# Writes the MetalLB IPAddressPool manifest (a single /32 address) and applies it.
# Globals:
#   DEFAULT_IP            (read) address offered to MetalLB
#   OSM_CLUSTER_WORK_DIR  (read) folder where the manifest is written
#   METALLB_IP_RANGE      (written) "<DEFAULT_IP>/32"
#   DEBUG_INSTALL         (read)
# Calls FATAL_TRACK when kubectl apply fails.
function configure_ipaddresspool_metallb() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    local manifest="${OSM_CLUSTER_WORK_DIR}/metallb-ipaddrpool.yaml"
    echo "Creating IP address pool manifest: ${manifest}"
    METALLB_IP_RANGE="$DEFAULT_IP/32"
    # The manifest is overwritten rather than appended to: appending on a re-run
    # would leave two concatenated documents without a separator
    sudo tee "${manifest}" <<EOF
apiVersion: metallb.io/v1beta1
kind: IPAddressPool
metadata:
  name: first-pool
  namespace: metallb-system
spec:
  addresses:
  - ${METALLB_IP_RANGE}
EOF
    echo "Applying IP address pool manifest: kubectl apply -f ${manifest}"
    kubectl apply -f "${manifest}" || FATAL_TRACK k8scluster "Cannot create IP address Pool in MetalLB"
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
169
# Installs cert-manager from the jetstack Helm repository into the
# cert-manager namespace.
# Globals:
#   CERTMANAGER_VERSION (written) chart version to install
function install_helm_certmanager() {
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG beginning of function
    fi
    echo "Installing cert-manager"
    CERTMANAGER_VERSION="v1.9.1"
    helm repo add jetstack https://charts.jetstack.io
    helm repo update
    # Chart options, passed to helm in exactly this order
    local -a chart_options=(
        --version "${CERTMANAGER_VERSION}"
        --set installCRDs=true
        --set prometheus.enabled=false
        --set clusterResourceNamespace=osm
        --set extraArgs="{--enable-certificate-owner-ref=true}"
    )
    helm install cert-manager --create-namespace --namespace cert-manager jetstack/cert-manager "${chart_options[@]}"
    if [ -n "${DEBUG_INSTALL}" ]; then
        DEBUG end of function
    fi
}
183
# Prints "name<TAB>ready<TAB>" for every line of a `kubectl get pod --no-headers`
# listing whose READY column is (mode "ready") or is not (mode "not_ready")
# one of the accepted values.
# Arguments:
#   $1 - "ready" or "not_ready"
#   $2 - accepted READY value besides "1/1" (e.g. "2/2")
#   $3 - listing to filter
function _select_pods_by_readiness() {
    echo "$3" | awk -v mode="$1" -v alt="$2" '
        {
            ready = ($2 == "1/1" || $2 == alt) ? 1 : 0
            wanted = (mode == "ready") ? 1 : 0
            if (ready == wanted) printf ("%s\t%s\t\n", $1, $2)
        }'
}

# Prints the number of non-empty lines in $1.
function _count_nonempty_lines() {
    echo "$1" | grep -c -v -e '^$'
}

# Reports the pods an add-on is still waiting for; prints nothing when there are none.
# Arguments:
#   $1 - add-on label, $2 - not-ready count, $3 - ready count, $4 - not-ready listing
function _report_pending_pods() {
    if [[ "$2" -ne 0 ]]; then
        echo "$1: Waiting for $2 of $(($2 + $3)) pods to be ready:"
        echo "$4"
        echo
    fi
}

# Waits until the OpenEBS, MetalLB and cert-manager pods have all been ready
# for a number of consecutive samples, or declares the cluster broken after a
# number of consecutive failed samples.
# Arguments (all optional, defaults keep the historical behaviour):
#   $1 - sampling period in seconds (default 2)
#   $2 - seconds the pods must stay ready (default 20)
#   $3 - seconds of consecutive failures before giving up (default 200)
# Calls FATAL_TRACK when the failure threshold is reached.
# The working variables are deliberately left global, as they always were.
function check_for_readiness() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    # Default input values
    sampling_period="${1:-2}"       # seconds
    time_for_readiness="${2:-20}"   # seconds ready
    time_for_failure="${3:-200}"    # seconds broken
    OPENEBS_NAMESPACE=openebs
    METALLB_NAMESPACE=metallb-system
    CERTMANAGER_NAMESPACE=cert-manager
    # STACK_NAME=osm                # By default, "osm"

    # Equivalent number of samples
    oks_threshold=$((time_for_readiness / sampling_period))      # No. ok samples to declare the system ready
    failures_threshold=$((time_for_failure / sampling_period))   # No. nok samples to declare the system broken
    failures_in_a_row=0
    oks_in_a_row=0

    ####################################################################################
    # Loop to check system readiness
    ####################################################################################
    while (( failures_in_a_row < failures_threshold && oks_in_a_row < oks_threshold )); do
        # State of OpenEBS. stderr is captured too, so an error message or an
        # empty namespace counts as "not ready"
        OPENEBS_STATE=$(kubectl get pod -n "${OPENEBS_NAMESPACE}" --no-headers 2>&1)
        OPENEBS_READY=$(_select_pods_by_readiness ready "2/2" "${OPENEBS_STATE}")
        OPENEBS_NOT_READY=$(_select_pods_by_readiness not_ready "2/2" "${OPENEBS_STATE}")
        COUNT_OPENEBS_READY=$(_count_nonempty_lines "${OPENEBS_READY}")
        COUNT_OPENEBS_NOT_READY=$(_count_nonempty_lines "${OPENEBS_NOT_READY}")

        # State of MetalLB
        METALLB_STATE=$(kubectl get pod -n "${METALLB_NAMESPACE}" --no-headers 2>&1)
        METALLB_READY=$(_select_pods_by_readiness ready "4/4" "${METALLB_STATE}")
        METALLB_NOT_READY=$(_select_pods_by_readiness not_ready "4/4" "${METALLB_STATE}")
        COUNT_METALLB_READY=$(_count_nonempty_lines "${METALLB_READY}")
        COUNT_METALLB_NOT_READY=$(_count_nonempty_lines "${METALLB_NOT_READY}")

        # State of CertManager
        CERTMANAGER_STATE=$(kubectl get pod -n "${CERTMANAGER_NAMESPACE}" --no-headers 2>&1)
        CERTMANAGER_READY=$(_select_pods_by_readiness ready "2/2" "${CERTMANAGER_STATE}")
        CERTMANAGER_NOT_READY=$(_select_pods_by_readiness not_ready "2/2" "${CERTMANAGER_STATE}")
        COUNT_CERTMANAGER_READY=$(_count_nonempty_lines "${CERTMANAGER_READY}")
        COUNT_CERTMANAGER_NOT_READY=$(_count_nonempty_lines "${CERTMANAGER_NOT_READY}")

        # OK sample: every add-on, cert-manager included, has no pending pod
        if (( COUNT_OPENEBS_NOT_READY + COUNT_METALLB_NOT_READY + COUNT_CERTMANAGER_NOT_READY == 0 )); then
            ((++oks_in_a_row))
            failures_in_a_row=0
            printf '===> Successful checks: %s/%s\r' "${oks_in_a_row}" "${oks_threshold}"
        # NOK sample
        else
            ((++failures_in_a_row))
            oks_in_a_row=0
            echo
            echo "Bootstraping... ${failures_in_a_row} checks of ${failures_threshold}"

            _report_pending_pods "OpenEBS" "${COUNT_OPENEBS_NOT_READY}" "${COUNT_OPENEBS_READY}" "${OPENEBS_NOT_READY}"
            _report_pending_pods "MetalLB" "${COUNT_METALLB_NOT_READY}" "${COUNT_METALLB_READY}" "${METALLB_NOT_READY}"
            _report_pending_pods "CertManager" "${COUNT_CERTMANAGER_NOT_READY}" "${COUNT_CERTMANAGER_READY}" "${CERTMANAGER_NOT_READY}"
        fi

        #------------ NEXT SAMPLE
        sleep "${sampling_period}"
    done

    ####################################################################################
    # OUTCOME
    ####################################################################################
    if (( failures_in_a_row >= failures_threshold )); then
        echo
        FATAL_TRACK k8scluster "K8S CLUSTER IS BROKEN"
    else
        echo
        echo "K8S CLUSTER IS READY"
    fi
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
283
# Deletes a Kubernetes namespace together with everything deployed in it.
# Arguments:
#   $1 - name of the namespace to delete
function remove_k8s_namespace() {
    [ -z "${DEBUG_INSTALL}" ] || DEBUG beginning of function
    local namespace="$1"
    echo "Deleting existing namespace ${namespace}: kubectl delete ns ${namespace}"
    # stderr is discarded, presumably because the namespace may not exist yet
    kubectl delete ns "${namespace}" 2>/dev/null
    [ -z "${DEBUG_INSTALL}" ] || DEBUG end of function
}
291
# main
# Command-line options:
#   -D <value>  stored in OSM_DEVOPS
#   -d <value>  stored in OSM_CLUSTER_WORK_DIR
#   -i <value>  stored in DEFAULT_IP
#   --debug     sets DEBUG_INSTALL to "y" (any other long option is rejected)
while getopts ":D:d:i:-: " o; do
    case "${o}" in
        D) OSM_DEVOPS="${OPTARG}" ;;
        d) OSM_CLUSTER_WORK_DIR="${OPTARG}" ;;
        i) DEFAULT_IP="${OPTARG}" ;;
        -)
            # Long options arrive as option "-" with the option name in OPTARG
            if [ "${OPTARG}" == "debug" ]; then
                DEBUG_INSTALL="y"
                continue
            fi
            echo -e "Invalid option: '--$OPTARG'\n" >&2
            exit 1
            ;;
        :)
            echo "Option -$OPTARG requires an argument" >&2
            exit 1
            ;;
        \?)
            echo -e "Invalid option: '-$OPTARG'\n" >&2
            exit 1
            ;;
        *) exit 1 ;;
    esac
done
322
# Both folders are mandatory: without them the script would source
# /common/logging and write the kubeadm configuration to the filesystem root.
if [ -z "${OSM_DEVOPS}" ]; then
    echo "Option -D (OSM devops folder) is required" >&2
    exit 1
fi
if [ -z "${OSM_CLUSTER_WORK_DIR}" ]; then
    echo "Option -d (cluster work folder) is required" >&2
    exit 1
fi

# Helper libraries; the functions of this script call DEBUG, FATAL_TRACK and
# track, which are presumably provided by these two files
source "${OSM_DEVOPS}/common/logging" || { echo "Cannot load ${OSM_DEVOPS}/common/logging" >&2; exit 1; }
source "${OSM_DEVOPS}/common/track" || { echo "Cannot load ${OSM_DEVOPS}/common/track" >&2; exit 1; }

echo "DEBUG_INSTALL=$DEBUG_INSTALL"
echo "OSM_DEVOPS=$OSM_DEVOPS"
echo "OSM_CLUSTER_WORK_DIR=$OSM_CLUSTER_WORK_DIR"
echo "HOME=$HOME"

echo "Creating folders for installation"
[ -d "${OSM_CLUSTER_WORK_DIR}" ] || sudo mkdir -p "${OSM_CLUSTER_WORK_DIR}"
echo "Copying kubeadm-config from $OSM_DEVOPS/installers/kubeadm-config.yaml to $OSM_CLUSTER_WORK_DIR/kubeadm-config.yaml"
# -b keeps a backup of a configuration left by a previous run
sudo cp -b "${OSM_DEVOPS}/installers/kubeadm-config.yaml" "${OSM_CLUSTER_WORK_DIR}/kubeadm-config.yaml"

install_kube
check_and_track_kube_install

init_kubeadm "${OSM_CLUSTER_WORK_DIR}/kubeadm-config.yaml"
kube_config_dir
check_and_track_init_k8s

deploy_cni_provider
taint_master_node
check_and_track_k8s_ready_before_helm

remove_k8s_namespace osm

# install_helm has been moved to install_helm_client.sh, run from full_install_osm.sh,
# but tracking is still here because the installation analytics still expects it
track k8scluster install_helm_ok

# Installation of storage class, metallb and cert-manager has been moved
# to install_cluster_addons.sh, run from full_install_osm.sh