This repository has been archived by the owner on Oct 22, 2024. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 55
/
setup-deployment.sh
executable file
·333 lines (318 loc) · 12.1 KB
/
setup-deployment.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
#!/bin/bash
set -o errexit
set -o pipefail
# Print the content of a file as one unwrapped line of base64 text,
# the encoding needed when embedding the file in a secret.
# Arguments: $1 - path of the file to encode
# Outputs:   the base64 text on stdout, without line breaks
read_key () {
    local key_file=$1
    base64 -w 0 "${key_file}"
}
# Locate the directory containing this script and load the test
# configuration from it. Both TEST_DIRECTORY and TEST_CONFIG can be
# overridden through the environment. All expansions are quoted so that
# a checkout path containing whitespace is not split into several words.
TEST_DIRECTORY=${TEST_DIRECTORY:-$(dirname "$(readlink -f "$0")")}
source "${TEST_CONFIG:-${TEST_DIRECTORY}/test-config.sh}"

# Name of the test cluster; selects the directory below _work.
CLUSTER=${CLUSTER:-pmem-govm}
# The repository root defaults to the parent of the script's directory.
REPO_DIRECTORY="${REPO_DIRECTORY:-$(dirname "$(dirname "$(readlink -f "$0")")")}"
CLUSTER_DIRECTORY="${CLUSTER_DIRECTORY:-${REPO_DIRECTORY}/_work/${CLUSTER}}"
# Helper from the cluster directory; the commands given to it are meant
# to run inside the cluster. It is combined with further words below and
# therefore gets expanded unquoted where it is used.
SSH="${CLUSTER_DIRECTORY}/ssh.0"
KUBECTL="${SSH} kubectl" # Always use the kubectl installed in the cluster.
KUBERNETES_VERSION="$(cat "$CLUSTER_DIRECTORY/kubernetes.version")"
# Version-specific deployment files; TEST_KUBERNETES_FLAVOR is appended
# verbatim and may be empty.
DEPLOYMENT_DIRECTORY="${REPO_DIRECTORY}/deploy/kubernetes-$KUBERNETES_VERSION${TEST_KUBERNETES_FLAVOR}"
# Translate the deployment mode into the sub-directory suffix that gets
# appended to the device mode: "testing" selects the "/testing" variant,
# "production" uses no suffix. Any other value aborts the script.
if [[ "${TEST_DEPLOYMENTMODE}" == "testing" ]]; then
    deployment_suffix="/testing"
elif [[ "${TEST_DEPLOYMENTMODE}" == "production" ]]; then
    deployment_suffix=""
else
    echo >&2 "invalid TEST_DEPLOYMENTMODE: ${TEST_DEPLOYMENTMODE}"
    exit 1
fi
# List of everything that gets deployed, in this order: first the entry
# named after device mode and deployment mode, then the storage classes.
DEPLOY=(${TEST_DEVICEMODE}${deployment_suffix})
for storageclass in ext4 ext4-kata xfs xfs-kata late-binding; do
    DEPLOY+=("pmem-storageclass-${storageclass}.yaml")
done
echo "INFO: deploying from ${DEPLOYMENT_DIRECTORY}/${TEST_DEVICEMODE}${deployment_suffix}"
# Set up TLS secrets in the TEST_DRIVER_NAMESPACE.
# The helper script runs with _work/bin prepended to PATH and receives
# the cluster's kubectl command via KUBECTL. The script path is quoted
# so that a directory name with whitespace stays a single word.
PATH="${REPO_DIRECTORY}/_work/bin:$PATH" KUBECTL="${KUBECTL}" "${TEST_DIRECTORY}/setup-ca-kubernetes.sh"
# Set to true when the cluster has the OpenShift scheduler configuration
# CRD; consulted later when the kustomize patches get generated.
OPENSHIFT_SCHEDULER=false
case "$KUBERNETES_VERSION" in
    1.19|1.20)
        # Enable scheduler extensions. Not needed on >= 1.21.
        DEPLOY+=(scheduler webhook)
        # Capture the CRD list before searching it. With "set -o pipefail",
        # "kubectl get crd | grep -q" can report failure despite a match:
        # grep -q exits at the first hit and the producer may then be
        # killed by SIGPIPE. A failing kubectl still counts as "CRD not
        # found" instead of aborting the script.
        crds=$(${KUBECTL} get crd) || crds=""
        if grep -q schedulers.config.openshift.io <<<"$crds"; then
            # Only the service gets deployed anew, with TEST_SCHEDULER_EXTENDER_NODE_PORT as
            # well-known, fixed node port. Config map and scheduler config must be
            # set up manually once before running tests.
            OPENSHIFT_SCHEDULER=true
            # Do some sanity checking. Problems are reported on stderr but
            # do not stop the deployment.
            policy=$(${KUBECTL} get scheduler/cluster -o 'jsonpath={.spec.policy.name}')
            if [ ! "$policy" ]; then
                echo >&2 "The scheduler config in scheduler/cluster must be set up manually. Currently there is no policy."
            elif ! ${KUBECTL} get -n openshift-config "configmap/$policy" >/dev/null; then
                # Only checked when a policy name exists; looking up
                # "configmap/" without a name cannot succeed.
                echo >&2 "The scheduler policy configmap must be set up manually."
            fi
        fi
        ;;
esac
# Deploy every entry of DEPLOY. Plain files are applied directly (storage
# classes get the node label patched in first). Directories are kustomize
# bases: they are copied into a temporary directory inside the cluster
# and wrapped in a generated overlay ("my-deployment") which adds the
# test-specific patches. The here-documents below are YAML, therefore
# their indentation is significant.
for deploy in "${DEPLOY[@]}"; do
    # Deployment files can come from:
    # 1. deploy/kubernetes-*
    # 2. deploy/common
    # 3. deploy/kustomize directly
    # The first existing location wins; "paths" collects every location
    # that was tried for the error message at the end.
    path="${DEPLOYMENT_DIRECTORY}/${deploy}"
    paths="$path"
    if ! [ -e "$path" ]; then
        path="${REPO_DIRECTORY}/deploy/common/${deploy}"
        paths+=" $path"
    fi
    if ! [ -e "$path" ]; then
        path="${REPO_DIRECTORY}/deploy/kustomize/${deploy}"
        paths+=" $path"
    fi
    if [ -f "$path" ]; then
        case "$path" in
            *storageclass*)
                # Patch the node selector label into the storage class instead of the default storage=pmem.
                sed -e "s;: storage\$;: \"$(echo $TEST_PMEM_NODE_LABEL | cut -d= -f1)\";" \
                    -e "s;- pmem\$;- \"$(echo $TEST_PMEM_NODE_LABEL | cut -d= -f2)\";" \
                    "$path" | ${KUBECTL} apply -f -
                ;;
            *)
                ${KUBECTL} apply -f - <"$path"
                ;;
        esac
    elif [ -d "$path" ]; then
        # A kustomize base. We need to copy all files over into the cluster, otherwise
        # `kubectl kustomize` won't work.
        tmpdir=$(${SSH} mktemp -d)
        # Register the cleanup immediately, so that a failure in any of the
        # following steps does not leave the directory behind.
        trap '${SSH} "rm -rf $tmpdir"' SIGTERM SIGINT EXIT
        # tar stores relative names: for an absolute path, pack relative to
        # / with the leading slash removed. -h follows symlinks.
        case "$path" in
            /*) tar -C / -chf - "${path#/}";;
            *) tar -chf - "$path";;
        esac | ${SSH} tar -xf - -C "$tmpdir"
        if [ -f "$path/pmem-csi.yaml" ]; then
            # Replace registry. This is easier with sed than kustomize...
            ${SSH} sed -i -e "s^intel/pmem^${TEST_PMEM_REGISTRY}/pmem^g" "$tmpdir/$path/pmem-csi.yaml"
            # Replace Namespace object name.
            # Must be "-i -e": GNU sed reads "-ie" as -i with backup
            # suffix "e" and would leave a stray "pmem-csi.yamle" behind.
            ${SSH} "sed -i -e 's;\(name: \)pmem-csi$;\1${TEST_DRIVER_NAMESPACE};g' $tmpdir/$path/pmem-csi.yaml"
            # Same for image pull policy.
            ${SSH} <<EOF
sed -i -e "s^imagePullPolicy:.IfNotPresent^imagePullPolicy: ${TEST_IMAGE_PULL_POLICY}^g" "$tmpdir/$path/pmem-csi.yaml"
EOF
        fi
        ${SSH} mkdir "$tmpdir/my-deployment"
        # The overlay starts with the copied base; everything else gets
        # appended to kustomization.yaml depending on what is deployed.
        ${SSH} "cat >'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
bases:
- ../$path
EOF
        case $deploy in
            ${TEST_DEVICEMODE}${deployment_suffix})
                # The driver itself: patch controller and node objects.
                ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
patchesJson6902:
- target:
    group: apps
    version: v1
    kind: Deployment
    name: pmem-csi-intel-com-controller
  path: scheduler-patch.yaml
EOF
                ${SSH} "cat >'$tmpdir/my-deployment/scheduler-patch.yaml'" <<EOF
- op: add
  path: /spec/template/spec/containers/0/command/-
  value: "--schedulerListen=:8000" # Exposed to kube-scheduler via the pmem-csi-scheduler service.
- op: add
  path: /spec/template/spec/containers/0/command/-
  value: -nodeSelector={$(echo ${TEST_PMEM_NODE_LABEL} | sed -e 's/\([^=]*\)=\(.*\)/"\1":"\2"/')}
EOF
                if $OPENSHIFT_SCHEDULER; then
                    # Append: these operations extend the controller patch
                    # written above. Truncating the file here would drop
                    # the --schedulerListen and -nodeSelector arguments.
                    ${SSH} "cat >>'$tmpdir/my-deployment/scheduler-patch.yaml'" <<EOF
- op: add
  path: /spec/template/spec/containers/0/command/-
  value: "--insecureSchedulerListen=:8001"
- op: replace
  # We get this from OpenShift (see service.beta.openshift.io/serving-cert-secret-name below).
  path: /spec/template/spec/volumes/0/secret/secretName
  value: pmem-csi-openshift-controller-tls
EOF
                fi
                if [ "${TEST_DEVICEMODE}" = "lvm" ]; then
                    # Test these options and kustomization by injecting some non-default values.
                    # This could be made optional to test both default and non-default values,
                    # but for now we just change this in all deployments.
                    ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
- target:
    group: apps
    version: v1
    kind: DaemonSet
    name: pmem-csi-intel-com-node
  path: lvm-parameters-patch.yaml
EOF
                    ${SSH} "cat >'$tmpdir/my-deployment/lvm-parameters-patch.yaml'" <<EOF
- op: add
  path: /spec/template/spec/containers/0/command/-
  value: "--pmemPercentage=50"
EOF
                fi
                ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
- target:
    group: apps
    version: v1
    kind: DaemonSet
    name: pmem-csi-intel-com-node-setup
  path: node-selector-patch.yaml
EOF
                ${SSH} "cat >'$tmpdir/my-deployment/node-selector-patch.yaml'" <<EOF
- op: add
  path: /spec/template/spec/containers/0/command/-
  value: -nodeSelector={$(echo ${TEST_PMEM_NODE_LABEL} | sed -e 's/\([^=]*\)=\(.*\)/"\1":"\2"/')}
EOF
                # Always use the configured label for selecting nodes.
                ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
- target:
    group: apps
    version: v1
    kind: DaemonSet
    name: pmem-csi-intel-com-node
  path: node-label-patch.yaml
EOF
                # NOTE(review): with deployment_suffix being "/testing" or
                # empty, this pattern only matches when TEST_DEVICEMODE
                # itself ends in "-testing" - confirm whether that is
                # still intended.
                case $deploy in
                    *-testing)
                        ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
- target:
    group: apps
    version: v1
    kind: DaemonSet
    name: pmem-csi-intel-com-node-testing
  path: node-label-patch.yaml
EOF
                        ;;
                esac
                # "key=value" from TEST_PMEM_NODE_LABEL becomes the YAML
                # flow mapping {key: "value"}.
                ${SSH} "cat >'$tmpdir/my-deployment/node-label-patch.yaml'" <<EOF
- op: add
  path: /spec/template/spec/nodeSelector
  value:
    {$(echo "${TEST_PMEM_NODE_LABEL}" | sed -e 's/\(.*\)=\(.*\)/\1: "\2"/')}
EOF
                ;;
            scheduler)
                # Change port number via JSON patch.
                ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
commonLabels:
  pmem-csi.intel.com/deployment: ${TEST_DEVICEMODE}-${TEST_DEPLOYMENTMODE}
patchesJson6902:
- target:
    version: v1
    kind: Service
    name: pmem-csi-intel-com-scheduler
  path: scheduler-patch.yaml
EOF
                ${SSH} "cat >'$tmpdir/my-deployment/scheduler-patch.yaml'" <<EOF
- op: add
  path: /spec/ports/0/nodePort
  value: ${TEST_SCHEDULER_EXTENDER_NODE_PORT}
- op: add
  path: /spec/type
  value: NodePort
EOF
                if $OPENSHIFT_SCHEDULER; then
                    ${SSH} "cat >>'$tmpdir/my-deployment/scheduler-patch.yaml'" <<EOF
- op: add
  path: /spec/ports/0/targetPort
  value: 8001 # need to use the insecure port
EOF
                fi
                ;;
            webhook)
                ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
commonLabels:
  pmem-csi.intel.com/deployment: ${TEST_DEVICEMODE}-${TEST_DEPLOYMENTMODE}
patchesJson6902:
- target:
    group: admissionregistration.k8s.io
    version: v1
    kind: MutatingWebhookConfiguration
    name: pmem-csi-intel-com-hook
  path: webhook-patch.yaml
EOF
                if $OPENSHIFT_SCHEDULER; then
                    # No caBundle here: the annotation asks OpenShift to
                    # inject it, and the service annotation below names the
                    # secret for the serving certificate.
                    ${SSH} "cat >'$tmpdir/my-deployment/webhook-patch.yaml'" <<EOF
- op: replace
  path: /webhooks/0/clientConfig/service/namespace
  value: ${TEST_DRIVER_NAMESPACE}
- op: replace
  path: /metadata/annotations
  value:
    service.beta.openshift.io/inject-cabundle: "true"
EOF
                    ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
- target:
    version: v1
    kind: Service
    name: pmem-csi-intel-com-webhook
  path: webhook-service-patch.yaml
EOF
                    ${SSH} "cat >'$tmpdir/my-deployment/webhook-service-patch.yaml'" <<EOF
- op: replace
  path: /metadata/annotations
  value:
    service.beta.openshift.io/serving-cert-secret-name: pmem-csi-openshift-controller-tls
EOF
                else
                    # Use the test CA certificate (${TEST_CA}.pem) as bundle.
                    ${SSH} "cat >'$tmpdir/my-deployment/webhook-patch.yaml'" <<EOF
- op: replace
  path: /webhooks/0/clientConfig/caBundle
  value: $(base64 -w 0 ${TEST_CA}.pem)
- op: replace
  path: /webhooks/0/clientConfig/service/namespace
  value: ${TEST_DRIVER_NAMESPACE}
EOF
                fi
                ;;
        esac
        ${SSH} "cat >>'$tmpdir/my-deployment/kustomization.yaml'" <<EOF
namespace: ${TEST_DRIVER_NAMESPACE}
EOF
        # When quickly taking down one installation of PMEM-CSI and recreating it, sometimes we get:
        # nodePort: Invalid value: 32000: provided port is already allocated
        #
        # A fix is going into 1.19: https://github.com/kubernetes/kubernetes/pull/89937/commits
        # Not sure whether that is applicable here because we don't use a HA setup and
        # besides, we also need to support older Kubernetes releases. Therefore we retry...
        start=$SECONDS
        while ! output="$(${KUBECTL} apply --kustomize "$tmpdir/my-deployment" 2>&1)"; do
            # Only the "port already allocated" error is retried, and only
            # for up to 60 seconds. Everything else is fatal.
            if grep -q "nodePort: Invalid value: ${TEST_SCHEDULER_EXTENDER_NODE_PORT}: provided port is already allocated" <<<"$output" &&
               [ $(($SECONDS - $start)) -lt 60 ]; then
                # Retry later...
                echo "Warning: kubectl failed with potentially temporary error, will try again: $output"
                sleep 1
            else
                echo "$output"
                exit 1
            fi
        done
        echo "$output"
        ${SSH} rm -rf "$tmpdir"
    else
        case "$path" in
            */scheduler|*/webhook)
                # optional, continue
                :
                ;;
            *)
                # Should be there, fail.
                echo >&2 "$paths are all missing."
                exit 1
                ;;
        esac
    fi
done
# Label the kube-system namespace with pmem-csi.intel.com/webhook=ignore
# (presumably so that the PMEM-CSI webhook skips it - confirm against
# the webhook configuration).
${KUBECTL} label --overwrite ns kube-system pmem-csi.intel.com/webhook=ignore

# Print usage hints unless TEST_DEPLOYMENT_QUIET is set to a non-empty value.
[ -n "${TEST_DEPLOYMENT_QUIET}" ] || cat <<EOF
To try out the PMEM-CSI driver with persistent volumes that use late binding:
cat deploy/common/pmem-pvc-late-binding.yaml | ${KUBECTL} create -f -
cat deploy/common/pmem-app-late-binding.yaml | ${KUBECTL} create -f -
To try out the PMEM-CSI driver with ephemeral volumes:
cat deploy/common/pmem-app-ephemeral.yaml | ${KUBECTL} create -f -
EOF