From 5b96829548c9c3a3646d0b4a2f26c5208a5036d8 Mon Sep 17 00:00:00 2001 From: Aiden Grossman Date: Thu, 24 Jul 2025 17:32:44 +0000 Subject: [PATCH 1/2] [CI] Add maintenance window to premerge clusters This patch adds an explicit maintenance window to the premerge clusters. This is in response to some control plane upgrades that we received notice of that will prevent access to the k8s control plane for ~15 minutes which means we will not be able to start new jobs. We should have this anyway though as the current node upgrade strategy also breaks jobs. --- premerge/gke_cluster/main.tf | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/premerge/gke_cluster/main.tf b/premerge/gke_cluster/main.tf index 2294c21e0..c2a7861d7 100644 --- a/premerge/gke_cluster/main.tf +++ b/premerge/gke_cluster/main.tf @@ -19,6 +19,16 @@ resource "google_container_cluster" "llvm_premerge" { workload_identity_config { workload_pool = "llvm-premerge-checks.svc.id.goog" } + + # We prefer that maintenance is done on weekends betwee 02:00 and 05:00 + # UTC when commit traffic is low to avoid interruptions. 
+ maintenance_policy { + recurring_window { + start_time = "2025-07-24T02:00:00Z" + end_time = "2025-07-24T05:00:00Z" + recurrence = "FREQ=WEEKLY;BYDAY=SA,SU" + } + } } resource "google_container_node_pool" "llvm_premerge_linux_service" { From f655945d2a4292da411f3e4ae20e5678ff3eaf11 Mon Sep 17 00:00:00 2001 From: Aiden Grossman Date: Thu, 24 Jul 2025 21:14:30 +0000 Subject: [PATCH 2/2] feedback --- premerge/gke_cluster/main.tf | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/premerge/gke_cluster/main.tf b/premerge/gke_cluster/main.tf index c2a7861d7..ea92a6a3a 100644 --- a/premerge/gke_cluster/main.tf +++ b/premerge/gke_cluster/main.tf @@ -20,7 +20,7 @@ resource "google_container_cluster" "llvm_premerge" { workload_pool = "llvm-premerge-checks.svc.id.goog" } - # We prefer that maintenance is done on weekends betwee 02:00 and 05:00 + # We prefer that maintenance is done on weekends between 02:00 and 05:00 # UTC when commit traffic is low to avoid interruptions. maintenance_policy { recurring_window {