
19530 Move copy-local-path based PVs outside of hwn01 or make basemap stateless #1409

Draft · wants to merge 21 commits into main

Commits (21)
57c3dd6
feat(flux/db-event-api/dev): add new slave on hwn04 (#19530 step 01.01)
hleb-rubanau Oct 1, 2024
052c11c
feat(flux/db-event-api/dev): switchover master to hwn04 (#19530 step …
hleb-rubanau Oct 1, 2024
6a0d984
feat(flux/db-event-api/dev): add new slave on hwn03 (#19530 step 01.03)
hleb-rubanau Oct 1, 2024
c88ddea
feat(flux/db-event-api/dev): eliminate legacy instance and update ins…
hleb-rubanau Oct 1, 2024
0f3a3a1
feat(flux/db-event-api/prod): add new slave on hwn04 (#19530 step 02)
hleb-rubanau Oct 1, 2024
e74bd68
feat(helm/basemap): support switching to emptydir (#19530, step 03.01)
hleb-rubanau Sep 20, 2024
673f17a
fix(helm/basemap/tileserver/dev): switch to emptydir (#19530, step 03…
hleb-rubanau Sep 27, 2024
2009285
fix(helm+flux/basemap/tileserver/test): switch to emptyDir and move f…
hleb-rubanau Sep 23, 2024
94b9335
fix(helm+flux/basemap/tileserver/prod): switch to emptyDir and move f…
hleb-rubanau Sep 23, 2024
6af3399
feat(helm/raster-tiler): support emptyDir storage (#19530, step 04.01)
hleb-rubanau Sep 23, 2024
63bb8ee
fix(helm+flux/raster-tiler/dev): switch to emptyDir and move from hwn…
hleb-rubanau Sep 23, 2024
0ea219a
fix(helm+flux/raster-tiler/geocint): switch to emptyDir and move from…
hleb-rubanau Sep 23, 2024
ef25f69
fix(flux/basemap/generator/test): stick to hwn02 (#19530, step 05.01)
hleb-rubanau Sep 27, 2024
323982b
fix(helm/basemap/generator/test): switch to emptydir (#19530, step 05…
hleb-rubanau Sep 27, 2024
98310a3
feat(helm/basemap/generator): support suspended jobs (#19530, step 06…
hleb-rubanau Oct 1, 2024
06bddaf
fix(helm+flux/basemap/generator/dev): suspend cronjob (#19530 step 06…
hleb-rubanau Oct 1, 2024
2439614
feat(flux/db-event-api/prod): switchover master to hwn04 (#19530 step…
hleb-rubanau Oct 1, 2024
55759e8
feat(flux/db-event-api/prod): new named replica on hwn03 (#19530 step…
hleb-rubanau Oct 1, 2024
1948caf
feat(flux/db-event-api/prod): eliminate legacy instance and update in…
hleb-rubanau Oct 1, 2024
ca114b4
fix(helm+flux/basemap/generator/dev): switch to emptyDir, move hwn03-…
hleb-rubanau Sep 23, 2024
70bfa1b
fix(helm+flux/basemap/generator/prod): switch to emptydir and move hw…
hleb-rubanau Sep 23, 2024
18 changes: 17 additions & 1 deletion flux/clusters/k8s-01/basemap/dev/kustomization.yaml
@@ -16,4 +16,20 @@ patches:
value:
- ./helm/basemap/values.yaml
- ./helm/basemap/values/values-dev.yaml
---
- target:
kind: CronJob
name: 'dev-basemap'
group: batch
version: v1
patch: |-
- op: add
path: /spec/jobTemplate/spec/template/spec/affinity/nodeAffinity
value:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: In
values:
- hwn02.k8s-01.kontur.io
Comment on lines +19 to +34
💡 Codebase verification

Inconsistent Node Affinity Strategy Detected

The addition of a hard-coded hostname (hwn02.k8s-01.kontur.io) for node affinity in the CronJob introduces an inconsistency with the repository's existing practices, which utilize labels for node selection. This deviation can lead to maintenance challenges and reduced flexibility.

Recommendations:

  1. Align with Existing Practices:

    • Use node labels instead of hard-coded hostnames for affinity. For example:
      nodeAffinity:
        requiredDuringSchedulingIgnoredDuringExecution:
          nodeSelectorTerms:
            - matchExpressions:
                - key: node-type
                  operator: In
                  values:
                    - basemap-storage
  2. Document Rationale:

    • If using a specific hostname is necessary, include comments within the YAML file or in the PR description to explain the reasoning behind this choice.
  3. Consider Flexibility:

    • Implement a fallback mechanism or use preferredDuringSchedulingIgnoredDuringExecution to ensure the CronJob can run even if the specified node is unavailable (see the sketch below).
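As a rough sketch of the fallback in item 3, the same JSON patch could express a soft preference instead of a hard requirement. This assumes a hypothetical node-type=basemap-storage label that would first have to be applied to the candidate nodes; it is not present in this repository:

  - op: add
    path: /spec/jobTemplate/spec/template/spec/affinity/nodeAffinity
    value:
      # soft preference: the scheduler favors labeled nodes but can fall back to any node
      preferredDuringSchedulingIgnoredDuringExecution:
        - weight: 100
          preference:
            matchExpressions:
              - key: node-type            # hypothetical label
                operator: In
                values:
                  - basemap-storage

The trade-off is that the job keeps running when no labeled node is schedulable, at the cost of losing the guarantee of co-location with the local-path volume.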
🔗 Analysis chain

Consider using more flexible node selection criteria

The addition of node affinity to the CronJob aligns with the PR objective of moving copy local path based PVs outside of hwn01. However, there are some concerns and suggestions to consider:

  1. Hard-coding a specific node hostname (hwn02.k8s-01.kontur.io) reduces flexibility and can cause issues if the node is unavailable or renamed.
  2. This approach might not scale well in a dynamic cluster environment.

Consider the following recommendations:

  1. Use more flexible node selection criteria, such as node labels or zones, instead of a specific hostname. For example:

    nodeAffinity:
      requiredDuringSchedulingIgnoredDuringExecution:
        nodeSelectorTerms:
          - matchExpressions:
              - key: node-type
                operator: In
                values:
                  - basemap-storage
  2. Document the reason for this specific node requirement in a comment within the YAML file or in the PR description. This will help future maintainers understand the rationale behind this decision.

  3. Consider implementing a fallback mechanism or using preferredDuringSchedulingIgnoredDuringExecution instead of requiredDuringSchedulingIgnoredDuringExecution to ensure the job can still run if the preferred node is unavailable.

To ensure this change doesn't conflict with other scheduling policies, let's check for any existing affinity rules or node selectors:

🏁 Scripts executed

The following scripts were executed for the analysis:

Script:

#!/bin/bash
# Check for existing affinity rules or node selectors in the dev environment
rg --type yaml 'affinity:|nodeSelector:' flux/clusters/k8s-01/basemap/dev/

Length of output: 76


Script:

#!/bin/bash
# Comprehensive search for affinity rules or node selectors in the entire repository
rg --type yaml 'affinity:|nodeSelector:'

Length of output: 1176


Script:

#!/bin/bash
# Search for node affinity definitions using labels instead of hard-coded hostnames
rg --type yaml 'nodeSelector' flux/clusters/k8s-01/ | rg -v 'kubernetes\.io/hostname'

Length of output: 2624

---
34 changes: 33 additions & 1 deletion flux/clusters/k8s-01/basemap/prod/kustomization.yaml
@@ -16,4 +16,36 @@ patches:
value:
- ./helm/basemap/values.yaml
- ./helm/basemap/values/values-prod.yaml
---
- target:
kind: Deployment
name: 'prod-basemap-tileserver'
group: apps
version: v1
patch: |-
- op: add
path: /spec/template/spec/affinity/nodeAffinity
value:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: NotIn
values:
- hwn01.k8s-01.kontur.io
- target:
kind: CronJob
name: 'prod-basemap'
group: batch
version: v1
patch: |-
- op: add
path: /spec/jobTemplate/spec/template/spec/affinity/nodeAffinity
value:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: In
values:
- hwn02.k8s-01.kontur.io
---
34 changes: 33 additions & 1 deletion flux/clusters/k8s-01/basemap/test/kustomization.yaml
@@ -16,4 +16,36 @@ patches:
value:
- ./helm/basemap/values.yaml
- ./helm/basemap/values/values-test.yaml
---
- target: # temporary stick to hwn02
kind: CronJob
name: 'test-basemap'
group: batch
version: v1
patch: |-
- op: add
path: /spec/jobTemplate/spec/template/spec/affinity/nodeAffinity
value:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: In
values:
- hwn02.k8s-01.kontur.io
- target: # temporary move out from hwn01
kind: Deployment
name: 'test-basemap-tileserver'
group: apps
version: v1
patch: |-
- op: add
path: /spec/template/spec/affinity/nodeAffinity
value:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: NotIn
values:
- hwn01.k8s-01.kontur.io
---
@@ -21,18 +21,12 @@ patchesJson6902:
kind: PostgresCluster
name: db-event-api
path: postgrescluster-custom-image.yaml
# - target:
# group: postgres-operator.crunchydata.com
# version: v1beta1
# kind: PostgresCluster
# name: db-event-api
# path: postgrescluster-resource-adjustment.yaml
- target:
- target: # new config for instances management
group: postgres-operator.crunchydata.com
version: v1beta1
kind: PostgresCluster
name: db-event-api
path: postgrescluster-assigning.yaml
path: postgrescluster-instances.yaml
Comment on lines +24 to +29
💡 Codebase verification

Incomplete removal of patch files

The patch files postgrescluster-resource-adjustment.yaml and postgrescluster-assigning.yaml are still referenced in several kustomization.yaml files across different overlays. Please remove these references to ensure consistency and prevent configuration issues.

  • References to postgrescluster-resource-adjustment.yaml:

    • flux/clusters/k8s-01/user-profile-api-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/user-profile-api-db/overlays/DEV/kustomization.yaml
    • flux/clusters/k8s-01/user-profile-api-db/overlays/PROD/kustomization.yaml
    • flux/clusters/k8s-01/layers-db/overlays/PROD/kustomization.yaml
    • flux/clusters/k8s-01/layers-db/overlays/DEV/kustomization.yaml
    • flux/clusters/k8s-01/layers-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/keycloak-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/keycloak-db/overlays/PROD/kustomization.yaml
    • flux/clusters/k8s-01/keycloak-db/overlays/DEV/kustomization.yaml
    • flux/clusters/k8s-01/insights-api-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/event-api-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/insights-api-db/overlays/PROD/kustomization.yaml
    • flux/clusters/k8s-01/insights-api-db/overlays/DEV/kustomization.yaml
  • References to postgrescluster-assigning.yaml:

    • flux/clusters/k8s-01/user-profile-api-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/layers-db/overlays/DEV/kustomization.yaml
    • flux/clusters/k8s-01/layers-db/overlays/PROD/kustomization.yaml
    • flux/clusters/k8s-01/layers-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/user-profile-api-db/overlays/DEV/kustomization.yaml
    • flux/clusters/k8s-01/user-profile-api-db/overlays/PROD/kustomization.yaml
    • flux/clusters/k8s-01/insights-api-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/keycloak-db/overlays/TEST/kustomization.yaml
    • flux/clusters/k8s-01/insights-api-db/overlays/PROD/kustomization.yaml
    • flux/clusters/k8s-01/keycloak-db/overlays/PROD/kustomization.yaml
    • flux/clusters/k8s-01/keycloak-db/overlays/DEV/kustomization.yaml
    • flux/clusters/k8s-01/insights-api-db/overlays/DEV/kustomization.yaml
🔗 Analysis chain

New patch added for instances management

A new patch postgrescluster-instances.yaml has been added for the PostgresCluster resource db-event-api. This addition aligns with the PR objective of potentially making the basemap stateless or moving persistent volumes.

To ensure this change is consistent with the rest of the configuration, please run the following script:

🏁 Scripts executed

The following scripts were executed for the analysis:

Script:

#!/bin/bash
# Description: Verify the contents of the new patch file and its references

# Test 1: Check if the new patch file exists
if [ -f "flux/clusters/k8s-01/event-api-db/overlays/DEV/postgrescluster-instances.yaml" ]; then
    echo "postgrescluster-instances.yaml exists."
    # Display the contents of the file
    cat "flux/clusters/k8s-01/event-api-db/overlays/DEV/postgrescluster-instances.yaml"
else
    echo "Error: postgrescluster-instances.yaml not found."
fi

# Test 2: Check for any other references to the new patch file
rg "postgrescluster-instances.yaml" --type yaml

Length of output: 3449


Script:

#!/bin/bash
# Description: Verify the removal of postgrescluster-resource-adjustment.yaml and postgrescluster-assigning.yaml

# Files to check
FILES=("postgrescluster-resource-adjustment.yaml" "postgrescluster-assigning.yaml")
BASE_DIR="flux/clusters/k8s-01/event-api-db/overlays/DEV"

for FILE in "${FILES[@]}"; do
    # Test 1: Check if the patch file exists
    if [ -f "${BASE_DIR}/${FILE}" ]; then
        echo "Error: ${FILE} still exists in ${BASE_DIR}."
    else
        echo "Success: ${FILE} has been removed from ${BASE_DIR}."
    fi

    # Test 2: Check for any references to the removed patch file in all kustomization.yaml files
    MATCHES=$(rg "${FILE}" --type yaml)
    if [ -z "$MATCHES" ]; then
        echo "Success: No references to ${FILE} found in any kustomization.yaml files."
    else
        echo "Error: References to ${FILE} found in the following kustomization.yaml files:"
        echo "$MATCHES"
    fi
done

Length of output: 12927


generatorOptions:
disableNameSuffixHash: true

This file was deleted.

@@ -0,0 +1,71 @@
# Always replace placeholder instances from `base`
- op: replace
path: /spec/instances
value:
- name: hwn04
replicas: 1
resources: &resources
limits:
memory: 512Gi # let Postgres use the page cache
cpu: '64' # set as event-api pool size + autovacuum workers + a bit for parallel workers
# empirical recommendations below
# memory: 100Gi
# cpu: '5'
requests:
memory: 22Gi # roughly shared_buffers + pool size * work_mem
cpu: '2' # if we don't have CPU we can run on potato
# empirical recommendations below
# memory: 7Gi
# cpu: '1'
dataVolumeClaimSpec: &storage
accessModes:
- ReadWriteOnce
resources:
requests:
storage: 100Gi
# empirical recommendations below -- actual storage varies from 2300Gi to 6200Gi
# storage: 2500Gi
affinity:
nodeAffinity:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: In
values:
- hwn04.k8s-01.kontur.io
- name: hwn03
replicas: 1
resources:
<<: *resources
dataVolumeClaimSpec:
<<: *storage
affinity:
nodeAffinity:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: In
values:
- hwn03.k8s-01.kontur.io

# Switchover section
# https://access.crunchydata.com/documentation/postgres-operator/latest/tutorials/cluster-management/administrative-tasks#changing-the-primary
# https://access.crunchydata.com/documentation/postgres-operator/latest/tutorials/cluster-management/administrative-tasks#targeting-an-instance
# 1. Requires fully-qualified instance id of new master
# 2. New master must be in sync with the current master (check via `patronictl list`)
# 3. It's recommended to retain the switchover section, to keep track of the last desired master both in code and k8s
- op: add
path: /spec/patroni/switchover
value:
enabled: true
targetInstance: db-event-api-hwn04-OVERRIDEME
#type: Failover
# trigger-switchover annotation triggers the actual switchover whenever it's updated
# value is arbitrary, but it's recommended to reference the date of the switchover
# the sequence ~1 escapes the slash in the annotation key (JSON Pointer syntax)
# See https://windsock.io/json-pointer-syntax-in-json-patches-with-kustomize/
- op: add
path: /metadata/annotations/postgres-operator.crunchydata.com~1trigger-switchover
value: OVERRIDEME
@@ -9,12 +9,12 @@ patchesJson6902:
kind: PostgresCluster
name: db-event-api
path: postgrescluster-s3-backups.yaml
- target:
- target: # new config for instances management
group: postgres-operator.crunchydata.com
version: v1beta1
kind: PostgresCluster
name: db-event-api
path: postgrescluster-resource-adjustment.yaml
path: postgrescluster-instances.yaml
- target:
group: postgres-operator.crunchydata.com
version: v1beta1
@@ -0,0 +1,71 @@
# Always replace placeholder instances from `base`
- op: replace
path: /spec/instances
value:
- name: hwn04
replicas: 1
resources: &resources
limits:
memory: 512Gi # let Postgres use the page cache
cpu: '64' # set as event-api pool size + autovacuum workers + a bit for parallel workers
# empirical recommendations below
# memory: 100Gi
# cpu: '5'
requests:
memory: 22Gi # roughly shared_buffers + pool size * work_mem
cpu: '2' # if we don't have CPU we can run on potato
# empirical recommendations below
# memory: 7Gi
# cpu: '1'
dataVolumeClaimSpec: &storage
accessModes:
- ReadWriteOnce
resources:
requests:
storage: 100Gi
# empirical recommendations below -- actual storage varies from 2300Gi to 6200Gi
# storage: 2500Gi
affinity:
nodeAffinity:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: In
values:
- hwn04.k8s-01.kontur.io
- name: hwn03
replicas: 1
resources:
<<: *resources
dataVolumeClaimSpec:
<<: *storage
affinity:
nodeAffinity:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: In
values:
- hwn03.k8s-01.kontur.io

# Switchover section
# https://access.crunchydata.com/documentation/postgres-operator/latest/tutorials/cluster-management/administrative-tasks#changing-the-primary
# https://access.crunchydata.com/documentation/postgres-operator/latest/tutorials/cluster-management/administrative-tasks#targeting-an-instance
# 1. Requires fully-qualified instance id of new master
# 2. New master must be in sync with the current master (check via `patronictl list`)
# 3. It's recommended to retain the switchover section, to keep track of the last desired master both in code and k8s
- op: add
path: /spec/patroni/switchover
value:
enabled: true
targetInstance: db-event-api-hwn04-OVERRIDEME
#type: Failover
# trigger-switchover annotation triggers the actual switchover whenever it's updated
# value is arbitrary, but it's recommended to reference the date of the switchover
# the sequence ~1 escapes the slash in the annotation key (JSON Pointer syntax)
# See https://windsock.io/json-pointer-syntax-in-json-patches-with-kustomize/
- op: add
path: /metadata/annotations/postgres-operator.crunchydata.com~1trigger-switchover
value: OVERRIDEME
Comment on lines +53 to +71
💡 Codebase verification

Action Required: Replace Placeholder Values Before Applying Configuration

The switchover configuration contains placeholder values that must be updated before it can be safely applied:

  1. Line 63: targetInstance: db-event-api-hwn04-OVERRIDEME
  2. Line 71: value: OVERRIDEME

Please replace these placeholders with the appropriate instance identifiers and values to ensure proper functionality.
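For illustration only, a filled-in version of the two patch operations might look like the sketch below; the instance suffix (abcd) and the annotation value are hypothetical and must be taken from the running cluster (for example, the instance set member shown by patronictl list):

  - op: add
    path: /spec/patroni/switchover
    value:
      enabled: true
      targetInstance: db-event-api-hwn04-abcd   # hypothetical suffix; use the real instance id
  - op: add
    path: /metadata/annotations/postgres-operator.crunchydata.com~1trigger-switchover
    value: '2024-10-01'   # arbitrary; referencing the switchover date follows the file's own convention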

🔗 Analysis chain

LGTM: Switchover configuration with a note on placeholders.

The switchover configuration is well-documented with helpful comments explaining the process and requirements. The use of an annotation to trigger the switchover is a good practice for Kubernetes-based operations.

However, please note that there are placeholders that need to be replaced before this configuration can be used:

  1. Line 63: db-event-api-hwn04-OVERRIDEME
  2. Line 71: OVERRIDEME

Ensure these are replaced with appropriate values before applying this configuration.

To verify the presence of these placeholders, you can run:

🏁 Scripts executed

The following scripts were executed for the analysis:

Script:

#!/bin/bash
# Check for OVERRIDEME placeholders in the file
grep -n "OVERRIDEME" flux/clusters/k8s-01/event-api-db/overlays/PROD/postgrescluster-instances.yaml

Length of output: 175

This file was deleted.

16 changes: 16 additions & 0 deletions flux/clusters/k8s-01/raster-tiler/dev/kustomization.yaml
@@ -16,4 +16,20 @@ patches:
value:
- ./helm/raster-tiler/values.yaml
- ./helm/raster-tiler/values/values-dev.yaml
- target:
kind: Deployment
name: 'dev-raster-tiler'
group: apps
version: v1
patch: |-
- op: add
path: /spec/template/spec/affinity/nodeAffinity
value:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: NotIn
values:
- hwn01.k8s-01.kontur.io
---
16 changes: 16 additions & 0 deletions flux/clusters/k8s-01/raster-tiler/geocint/kustomization.yaml
@@ -16,4 +16,20 @@ patches:
value:
- ./helm/raster-tiler/values.yaml
- ./helm/raster-tiler/values/values-geocint.yaml
- target:
kind: Deployment
name: 'geocint-raster-tiler'
group: apps
version: v1
patch: |-
- op: add
path: /spec/template/spec/affinity/nodeAffinity
value:
requiredDuringSchedulingIgnoredDuringExecution:
nodeSelectorTerms:
- matchExpressions:
- key: kubernetes.io/hostname
operator: NotIn
values:
- hwn01.k8s-01.kontur.io
---
2 changes: 1 addition & 1 deletion helm/basemap/Chart.yaml
@@ -15,7 +15,7 @@ type: application
# This is the chart version. This version number should be incremented each time you make changes
# to the chart and its templates, including the app version.
# Versions are expected to follow Semantic Versioning (https://semver.org/)
version: 0.0.37
version: 0.0.45

#Don't use appVersion, use {{ .Values.images...tag's. }} instead. That's required for Flux automation - so that different
# stages can have different versions within the same branch watched by Flux.