forked from chainzero/provider-build-scripts
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathworkerNode.sh
119 lines (100 loc) · 3.68 KB
/
workerNode.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
#!/usr/bin/env bash
# Example use:
#./worker.sh -m 10.128.0.8 -t K10cef5da8867a6d3d2acc25aa817c7c06f86a638ee7ad4c0668c248c23167c1140::server:da3e13b2aafc1983789be9841b7e5e83 -g -s -o /data/k3s -k /data/kubelet
# Worker Script
# Initialize variables
master_ip=""
token=""
install_gpu_drivers=false
install_storage_support=false
nodefs_dir=""
imagefs_dir=""
INSTALL_K3S_EXEC=""
# Process command-line options
while getopts ":m:t:gsk:o:" opt; do
case ${opt} in
m )
master_ip=$OPTARG
;;
t )
token=$OPTARG
;;
g )
install_gpu_drivers=true
;;
s )
install_storage_support=true
;;
k )
nodefs_dir="--kubelet-arg=root-dir=$OPTARG"
;;
o )
imagefs_dir="--data-dir=$OPTARG"
;;
\? )
echo "Invalid option: $OPTARG" 1>&2
exit 1
;;
: )
echo "Invalid option: $OPTARG requires an argument" 1>&2
exit 1
;;
esac
done
shift $((OPTIND -1))
# Check if the master IP and token have been provided
if [ -z "$master_ip" ] || [ -z "$token" ]; then
echo "Both master IP (-m) and token (-t) must be provided."
exit 1
fi
# debugging OPTARG
echo "Debug: nodefs_dir = $nodefs_dir"
echo "Debug: imagefs_dir = $imagefs_dir"
# Install K3s worker node
echo "Starting K3s installation on worker node..."
echo "INSTALL_K3S_EXEC value: agent ${nodefs_dir} ${imagefs_dir}"
curl -sfL https://get.k3s.io | K3S_URL=https://$master_ip:6443 K3S_TOKEN=$token INSTALL_K3S_EXEC="$nodefs_dir $imagefs_dir" sh -
# Check if K3s agent is running
echo "Verifying K3s installation on worker node..."
if systemctl is-active --quiet k3s-agent; then
echo "K3s installation completed on worker node."
else
echo "K3s installation failed on worker node. Please check the logs for more information."
exit 1
fi
# GPU host prep, driver, and toolkit install
if [ "$install_gpu_drivers" = true ]; then
echo "Starting GPU host preparation, driver, and toolkit installation..."
apt update
DEBIAN_FRONTEND=noninteractive apt-get -y -o Dpkg::Options::="--force-confdef" -o Dpkg::Options::="--force-confold" dist-upgrade
apt-get autoremove -y
echo "Installing NVIDIA drivers..."
apt-get install -y ubuntu-drivers-common
ubuntu-drivers devices
ubuntu-drivers autoinstall
echo "NVIDIA GPU drivers installation completed."
echo "Installing NVIDIA container runtime..."
distribution="stable/deb"
curl -s -L https://nvidia.github.io/libnvidia-container/gpgkey | apt-key add -
curl -s -L https://nvidia.github.io/libnvidia-container/$distribution/libnvidia-container.list | tee /etc/apt/sources.list.d/libnvidia-container.list
apt-get update
DEBIAN_FRONTEND=noninteractive apt-get install -y nvidia-container-toolkit nvidia-container-runtime
echo "NVIDIA container runtime installation completed."
# Update nvidia runtime config
CONFIG_FILE="/etc/nvidia-container-runtime/config.toml"
if [ -f "$CONFIG_FILE" ]; then
echo "Updating NVIDIA runtime configuration..."
sed -i 's/#accept-nvidia-visible-devices-as-volume-mounts = false/accept-nvidia-visible-devices-as-volume-mounts = true/' "$CONFIG_FILE"
sed -i 's/#accept-nvidia-visible-devices-envvar-when-unprivileged = true/accept-nvidia-visible-devices-envvar-when-unprivileged = false/' "$CONFIG_FILE"
else
echo "NVIDIA runtime configuration file not found."
fi
fi
# Persistent storage support with Rook-Ceph if enabled
if [ "$install_storage_support" = true ]; then
echo "Persistent storage support enabled, installing necessary packages..."
apt-get update
apt-get install -y lvm2
echo "LVM package installed for persistent storage support."
fi
echo "Worker node setup completed."