@@ -35,35 +35,38 @@ DRIVER_NAME=$(from_versions_mk "DRIVER_NAME")
35
35
36
36
# Resource names are derived from the driver name resolved earlier in the script.
NETWORK_NAME="${DRIVER_NAME}-net"
CLUSTER_NAME="${DRIVER_NAME}-cluster"
# GKE version requested for both the control plane and the node pools.
NODE_VERSION="1.32"
# Region hosting the Cloud Router / NAT configuration for the network.
ROUTER_REGION="us-central1"
# NOTE: despite its name, REGION holds a *zone*. It is used as the location of
# the cluster and its node pools.
REGION="us-central1-c"
39
41
40
42
## Create the network for the cluster
# Auto subnet mode creates one subnet per region; routing is regional.
gcloud compute networks create "${NETWORK_NAME}" \
  --quiet \
  --project="${PROJECT_NAME}" \
  --description="Manually created network for DRA beta test cluster" \
  --subnet-mode=auto \
  --mtu=1460 \
  --bgp-routing-mode=regional
48
50
49
51
## Create the cluster
# Enables the resource.k8s.io/v1beta1 (DRA) APIs on a rapid-channel cluster.
# - REGION holds a zone, so it is passed through --location, which accepts
#   either a zone or a region.
# - --project is given explicitly so the cluster lands in the same project as
#   the network it attaches to, instead of relying on the gcloud default.
gcloud container clusters create "${CLUSTER_NAME}" \
  --quiet \
  --project "${PROJECT_NAME}" \
  --enable-kubernetes-unstable-apis="resource.k8s.io/v1beta1/deviceclasses,resource.k8s.io/v1beta1/resourceclaims,resource.k8s.io/v1beta1/resourceclaimtemplates,resource.k8s.io/v1beta1/resourceslices" \
  --release-channel=rapid \
  --no-enable-autorepair \
  --enable-autoupgrade \
  --location "${REGION}" \
  --num-nodes "1" \
  --network "${NETWORK_NAME}" \
  --cluster-version "${NODE_VERSION}" \
  --node-version "${NODE_VERSION}"
60
63
61
64
# Create t4 node pool
62
65
gcloud beta container node-pools create " pool-1" \
63
66
--quiet \
64
67
--project " ${PROJECT_NAME} " \
65
68
--cluster " ${CLUSTER_NAME} " \
66
- --region " us-west1 " \
69
+ --region " ${REGION} " \
67
70
--node-version " ${NODE_VERSION} " \
68
71
--machine-type " n1-standard-8" \
69
72
--accelerator " type=nvidia-tesla-t4,count=1" \
@@ -77,19 +80,19 @@ gcloud beta container node-pools create "pool-1" \
77
80
--min-nodes " 2" \
78
81
--max-nodes " 6" \
79
82
--location-policy " ANY" \
80
- --no- enable-autoupgrade \
83
+ --enable-autoupgrade \
81
84
--no-enable-autorepair \
82
85
--max-surge-upgrade 1 \
83
86
--max-unavailable-upgrade 0 \
84
- --node-locations " us-west1-a " \
87
+ --node-locations " ${REGION} " \
85
88
--node-labels=gke-no-default-nvidia-gpu-device-plugin=true,nvidia.com/gpu.present=true
86
89
87
90
# Create v100 node pool
88
91
gcloud beta container node-pools create " pool-2" \
89
92
--quiet \
90
93
--project " ${PROJECT_NAME} " \
91
94
--cluster " ${CLUSTER_NAME} " \
92
- --region " us-west1 " \
95
+ --region " ${REGION} " \
93
96
--node-version " ${NODE_VERSION} " \
94
97
--machine-type " n1-standard-8" \
95
98
--accelerator " type=nvidia-tesla-v100,count=1" \
@@ -103,30 +106,30 @@ gcloud beta container node-pools create "pool-2" \
103
106
--min-nodes " 1" \
104
107
--max-nodes " 6" \
105
108
--location-policy " ANY" \
106
- --no- enable-autoupgrade \
109
+ --enable-autoupgrade \
107
110
--no-enable-autorepair \
108
111
--max-surge-upgrade 1 \
109
112
--max-unavailable-upgrade 0 \
110
- --node-locations " us-west1-a " \
113
+ --node-locations " ${REGION} " \
111
114
--node-labels=gke-no-default-nvidia-gpu-device-plugin=true,nvidia.com/gpu.present=true
112
115
113
116
## Allow the GPU nodes access to the internet
# Cloud Router that the NAT configuration is attached to. The router name is
# quoted so the expansion is never word-split or globbed.
gcloud compute routers create "${NETWORK_NAME}-nat-router" \
  --quiet \
  --project "${PROJECT_NAME}" \
  --network "${NETWORK_NAME}" \
  --region "${ROUTER_REGION}"
119
122
120
123
# NAT configuration on the "${NETWORK_NAME}-nat-router" router: covers every
# subnet IP range and lets Google allocate the external NAT addresses.
gcloud compute routers nats create "${NETWORK_NAME}-nat-config" \
  --quiet \
  --project "${PROJECT_NAME}" \
  --router "${NETWORK_NAME}-nat-router" \
  --nat-all-subnet-ip-ranges \
  --auto-allocate-nat-external-ips \
  --router-region "${ROUTER_REGION}"
127
130
128
131
## Start using this cluster for kubectl
# Writes the cluster's credentials into the local kubeconfig. --project is
# passed explicitly, like the other resource commands in this script.
gcloud container clusters get-credentials "${CLUSTER_NAME}" \
  --project "${PROJECT_NAME}" \
  --location="${REGION}"
130
133
131
134
# # Launch the nvidia-driver-installer daemonset to install the GPU drivers on any GPU nodes that come online:
132
135
# Remove the cloud.google.com/gke-gpu-driver-version label (the trailing '-'
# means "delete this label") from every node selected by
# nvidia.com/gpu.present=true.
# NOTE(review): presumably this lets the driver-installer daemonset manage the
# GPU driver on those nodes — confirm against the rest of the script.
kubectl label node --overwrite -l nvidia.com/gpu.present=true cloud.google.com/gke-gpu-driver-version-
0 commit comments