Skip to content

Commit

Permalink
Merge pull request #2554 from consideRatio/pr/awi-ciroh-maint
Browse files Browse the repository at this point in the history
awi-ciroh: upgrade k8s to 1.25, and adjust node pools following event
  • Loading branch information
consideRatio authored May 19, 2023
2 parents 904a280 + 869d9c2 commit 86659aa
Show file tree
Hide file tree
Showing 3 changed files with 46 additions and 88 deletions.
3 changes: 3 additions & 0 deletions config/clusters/awi-ciroh/common.values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -78,6 +78,9 @@ basehub:
# the previous 1:1 user:node setup with a node sharing setup. It
# is not meant to be retained long term!
#
# - [ ] Make this cluster have a node sharing setup like in the
# basehub/daskhub template.
#
- display_name: "Small"
description: 5GB RAM, 2 CPUs
default: true
Expand Down
121 changes: 33 additions & 88 deletions terraform/gcp/projects/awi-ciroh.tfvars
Original file line number Diff line number Diff line change
Expand Up @@ -2,11 +2,18 @@ prefix = "awi-ciroh"
project_id = "awi-ciroh"
zone = "us-central1-b"
region = "us-central1"
core_node_machine_type = "n1-highmem-4"
core_node_machine_type = "n2-highmem-4"
enable_network_policy = true
enable_filestore = true
filestore_capacity_gb = 1024

# GKE Kubernetes versions pinned for this cluster: one entry for the
# control plane (min_master_version) and one per node pool kind (core,
# notebook, dask).
#
# NOTE(review): the control plane entry is on a newer 1.25 patch release
# (1.25.8-gke.500) than the node pools (1.25.6-gke.1000). Presumably this is
# intentional, since node versions may lag behind the control plane version,
# but confirm before bumping only one of them.
k8s_versions = {
min_master_version: "1.25.8-gke.500",
core_nodes_version: "1.25.6-gke.1000",
notebook_nodes_version: "1.25.6-gke.1000",
dask_nodes_version: "1.25.6-gke.1000",
}

user_buckets = {
"scratch-staging": {
"delete_after": 7
Expand All @@ -27,110 +34,48 @@ notebook_nodes = {
"small" : {
min : 0,
max : 100,
machine_type : "n1-standard-2",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
machine_type : "n2-highmem-4",
labels : {},
gpu : {
enabled : false,
type : "",
count : 0
}
},
"medium" : {
min : 0,
max : 100,
machine_type : "n1-standard-4",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
machine_type : "n2-highmem-16",
labels : {},
gpu : {
enabled : false,
type : "",
count : 0
}
},
"large" : {
min : 0,
max : 100,
machine_type : "n1-standard-8",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
}
},
"huge" : {
min : 0,
max : 100,
machine_type : "n1-standard-16",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
}
},
# added stressfully before an event where we ran out of ssd quota, see
# https://github.com/2i2c-org/infrastructure/pull/2539 and the linked
# event https://github.com/2i2c-org/infrastructure/issues/2520.
#
# FIXME: make this cluster have a node sharing setup like in the
# basehub/daskhub template.
#
"highmem-medium" : {
min : 10,
max : 100,
machine_type : "n2-highmem-16",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
machine_type : "n2-highmem-64",
labels : {},
gpu : {
enabled : false,
type : "",
count : 0
}
},
}

dask_nodes = {
"small" : {
min : 0,
max : 100,
machine_type : "n1-standard-2",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
}
},
"medium" : {
min : 0,
max : 100,
machine_type : "n1-standard-4",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
}
},
"large" : {
min : 0,
max : 100,
machine_type : "n1-standard-8",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
}
},
"huge" : {
min : 0,
max : 100,
machine_type : "n1-standard-16",
labels: {},
gpu: {
enabled: false,
type: "",
count: 0
max : 200,
machine_type : "n2-highmem-16",
labels : {},
gpu : {
enabled : false,
type : "",
count : 0
}
},
}
Expand Down
10 changes: 10 additions & 0 deletions terraform/gcp/variables.tf
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,13 @@ variable "project_id" {

variable "k8s_version_prefixes" {
type = set(string)
# Available minor versions are picked from the GKE regular release channel. To
# see the available versions see
# https://cloud.google.com/kubernetes-engine/docs/release-notes-regular
#
# This list should include every minor version available in the regular release
# channel, so minor versions will need to be added or removed here over time.
#
default = [
"1.22.",
"1.23.",
Expand All @@ -35,6 +42,9 @@ variable "k8s_version_prefixes" {
description = <<-EOT
A list of k8s version prefixes that can be evaluated to their latest version by
the output defined in cluster.tf called regular_channel_latest_k8s_versions.
For details about release channels (rapid, regular, stable), see:
https://cloud.google.com/kubernetes-engine/docs/concepts/release-channels#channels
EOT
}

Expand Down

0 comments on commit 86659aa

Please sign in to comment.