feat(chart): implement HPA spec with prometheus-adapter config (P6.6, miroir-m9q.6)

Implements the HPA specification from plan §14.4: - values.yaml: Add per-workload-tier min/max defaults (≤5k QPS: min=4, max=8) - values.yaml: Add stabilization windows (scale-up: 30s, scale-down: 300s) - values.yaml: Add custom metrics (targetRequestsInFlight: 500, targetBackgroundQueueDepth: 10) - values.yaml: Update targetMemoryUtilizationPercentage from 80% to 75% (per plan §14.4) - values.schema.json: Add behavior, targetRequestsInFlight, targetBackgroundQueueDepth properties - miroir-hpa.yaml: Fix value paths from .Values.hpa.* to .Values.miroir.hpa.* - miroir-hpa.yaml: Remove selector from external metric (not applicable for Value type) - miroir-prometheus-adapter-configmap.yaml: New separate ConfigMap for prometheus-adapter rules - NOTES.txt: Add prometheus-adapter prerequisite documentation with verification steps Chart preconditions enforced via values.schema.json: - hpa.enabled: true requires replicas >= 2 AND taskStore.backend: redis - prometheus-adapter (or equivalent) is a documented prerequisite when HPA is enabled Closes: miroir-m9q.6 Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
2026-05-24 06:37:40 -04:00 · 2026-05-24 06:37:40 -04:00 · 57d5098bd3
commit 57d5098bd3
parent e2fa9b2a7f
5 changed files with 107 additions and 90 deletions
--- a/charts/miroir/templates/NOTES.txt
+++ b/charts/miroir/templates/NOTES.txt
@ -35,6 +35,30 @@ Redis is deployed and accessible at:

 {{- end }}

+{{- if .Values.miroir.hpa.enabled }}
+
+HPA is enabled for this deployment.
+
+IMPORTANT: HPA uses custom metrics (miroir_requests_in_flight, miroir_background_queue_depth) that require prometheus-adapter (or an equivalent custom/external metrics API bridge). This chart does NOT install prometheus-adapter — it must be deployed separately in your cluster.
+
+To verify prometheus-adapter is configured correctly:
+
+1. Check the custom metrics API is available:
+   kubectl get --raw /apis/custom.metrics.k8s.io/v1beta1 | jq .
+
+2. Query the per-pod metric:
+   kubectl get --raw /apis/custom.metrics.k8s.io/v1beta1/namespaces/{{ .Release.Namespace }}/pods/*/miroir_requests_in_flight | jq .
+
+3. Query the global metric (requires prometheus-adapter external metrics):
+   kubectl get --raw /apis/external.metrics.k8s.io/v1beta1/namespaces/{{ .Release.Namespace }}/miroir_background_queue_depth | jq .
+
+4. Check HPA status and current metrics:
+   kubectl describe hpa {{ include "miroir.fullname" . }}-miroir -n {{ .Release.Namespace }}
+
+This chart renders a ConfigMap ({{ include "miroir.fullname" . }}-prometheus-adapter-metrics) with the required prometheus-adapter rules. Configure your prometheus-adapter installation to load rules from ConfigMaps with the label: app.kubernetes.io/name={{ include "miroir.name" . }}
+
+{{- end }}
+
 To verify the deployment, run:
  kubectl get pods --namespace {{ .Release.Namespace }} -l "app.kubernetes.io/name={{ include "miroir.name" . }},app.kubernetes.io/instance={{ .Release.Name }}"

--- a/charts/miroir/templates/miroir-hpa.yaml
+++ b/charts/miroir/templates/miroir-hpa.yaml
@ -1,9 +1,9 @@
 {{/*
 Miroir Horizontal Pod Autoscaler (plan §14.4)
 Requires prometheus-adapter for custom metrics (miroir_requests_in_flight, miroir_background_queue_depth).
-The prometheus-adapter dependency is auto-enabled when hpa.enabled=true.
+The prometheus-adapter dependency is a prerequisite when hpa.enabled=true (see NOTES.txt).
 */}}
-{{- if and .Values.miroir.replicas .Values.hpa.enabled }}
+{{- if and .Values.miroir.replicas .Values.miroir.hpa.enabled }}
 apiVersion: autoscaling/v2
 kind: HorizontalPodAutoscaler
 metadata:
@ -12,37 +12,34 @@ metadata:
    {{- include "miroir.labels" . | nindent 4 }}
    app.kubernetes.io/component: miroir
  annotations:
-    {{- with .Values.hpa.annotations }}
+    {{- with .Values.miroir.hpa.annotations }}
    {{- toYaml . | nindent 4 }}
    {{- end }}
-    {{- if .Values.hpa.enabled }}
-    helm.sh/hook: post-install,post-upgrade
-    {{- end }}
 spec:
  scaleTargetRef:
    apiVersion: apps/v1
    kind: Deployment
    name: {{ include "miroir.fullname" . }}-miroir
-  minReplicas: {{ .Values.hpa.minReplicas }}
-  maxReplicas: {{ .Values.hpa.maxReplicas }}
+  minReplicas: {{ .Values.miroir.hpa.minReplicas }}
+  maxReplicas: {{ .Values.miroir.hpa.maxReplicas }}
  metrics:
-    {{- if .Values.hpa.targetCPUUtilizationPercentage }}
+    {{- if .Values.miroir.hpa.targetCPUUtilizationPercentage }}
    - type: Resource
      resource:
        name: cpu
        target:
          type: Utilization
-          averageUtilization: {{ .Values.hpa.targetCPUUtilizationPercentage }}
+          averageUtilization: {{ .Values.miroir.hpa.targetCPUUtilizationPercentage }}
    {{- end }}
-    {{- if .Values.hpa.targetMemoryUtilizationPercentage }}
+    {{- if .Values.miroir.hpa.targetMemoryUtilizationPercentage }}
    - type: Resource
      resource:
        name: memory
        target:
          type: Utilization
-          averageUtilization: {{ .Values.hpa.targetMemoryUtilizationPercentage }}
+          averageUtilization: {{ .Values.miroir.hpa.targetMemoryUtilizationPercentage }}
    {{- end }}
-    {{- if .Values.hpa.targetRequestsInFlight }}
+    {{- if .Values.miroir.hpa.targetRequestsInFlight }}
    # Per-pod custom metric (plan §14.4)
    # Type: Pods AverageValue
    # Query: sum(miroir_requests_in_flight{pod=<pod>}) by (pod)
@ -57,9 +54,9 @@ spec:
              app.kubernetes.io/component: miroir
        target:
          type: AverageValue
-          averageValue: {{ .Values.hpa.targetRequestsInFlight | default "500" }}
+          averageValue: {{ .Values.miroir.hpa.targetRequestsInFlight | default "500" }}
    {{- end }}
-    {{- if .Values.hpa.targetBackgroundQueueDepth }}
+    {{- if .Values.miroir.hpa.targetBackgroundQueueDepth }}
    # Global custom metric (plan §14.4)
    # Type: External Value (not averaged across pods)
    # Query: sum(miroir_background_queue_depth)
@ -69,80 +66,12 @@ spec:
      external:
        metric:
          name: miroir_background_queue_depth
-          selector:
-            matchLabels:
-              {{- include "miroir.selectorLabels" . | nindent 14 }}
-              app.kubernetes.io/component: miroir
        target:
          type: Value
-          value: {{ .Values.hpa.targetBackgroundQueueDepth | default "10" }}
+          value: {{ .Values.miroir.hpa.targetBackgroundQueueDepth | default "10" }}
    {{- end }}
-  {{- with .Values.hpa.behavior }}
+  {{- with .Values.miroir.hpa.behavior }}
  behavior:
    {{- toYaml . | nindent 4 }}
  {{- end }}
 {{- end }}
-
-{{/*
-PrometheusAdapter custom metrics configuration (plan §14.4)
-Auto-rendered when hpa.enabled=true to configure prometheus-adapter for Miroir metrics.
-This ConfigMap is consumed by the prometheus-adapter Helm chart.
-*/}}
-{{- if and .Values.miroir.replicas .Values.hpa.enabled }}
-apiVersion: v1
-kind: ConfigMap
-metadata:
-  name: {{ include "miroir.fullname" . }}-prometheus-adapter-metrics
-  labels:
-    {{- include "miroir.labels" . | nindent 4 }}
-  annotations:
-    helm.sh/hook: pre-install,pre-upgrade
-    helm.sh/hook-weight: "-5"
-data:
-  # Custom metrics for Miroir HPA (plan §14.4)
-  # Per-pod metric: miroir_requests_in_flight
-  # Type: Pods (average value across all pods)
-  rules.yaml: |
-    - seriesQuery: '{__name__="miroir_requests_in_flight",namespace="{{ .Release.Namespace }}"}'
-      name:
-        as: "miroir_requests_in_flight"
-      metricsQuery: |
-        sum(miroir_requests_in_flight{<<.LabelMatchers>>}) by (<<.GroupBy>>)
-      resource:
-        name: miroir_requests_in_flight
-      container: miroir
-      type:
-        type: Pods
-    # Global metric: miroir_background_queue_depth
-    # Type: Value (not averaged, global cluster-wide metric)
-    - seriesQuery: '{__name__="miroir_background_queue_depth",namespace="{{ .Release.Namespace }}"}'
-      name:
-        as: "miroir_background_queue_depth"
-      metricsQuery: |
-        sum(miroir_background_queue_depth{<<.LabelMatchers>>})
-      resource:
-        name: miroir_background_queue_depth
-      type:
-        type: Value
-{{- end }}
-{{- if and .Values.miroir.replicas .Values.hpa.enabled }}
---
-# NOTES: Prometheus Adapter Configuration (plan §14.4)
-#
-# The Miroir Helm chart auto-enables prometheus-adapter when HPA is enabled.
-# Custom metrics are configured via the ConfigMap above.
-#
-# To verify prometheus-adapter is working:
-#
-# 1. Check the custom metrics API is available:
-#    kubectl get --raw /apis/custom.metrics.k8s.io/v1beta1 | jq .
-#
-# 2. Query the per-pod metric:
-#    kubectl get --raw /apis/custom.metrics.k8s.io/v1beta1/namespaces/{{ .Release.Namespace }}/pods/miroir_requests_in_flight | jq .
-#
-# 3. Query the global metric:
-#    kubectl get --raw /apis/custom.metrics.k8s.io/v1beta1/namespaces/{{ .Release.Namespace }}/miroir_background_queue_depth | jq .
-#
-# 4. Check HPA status:
-#    kubectl describe hpa {{ include "miroir.fullname" . }}-miroir
-{{- end }}
--- a/charts/miroir/templates/miroir-prometheus-adapter-configmap.yaml
+++ b/charts/miroir/templates/miroir-prometheus-adapter-configmap.yaml
@ -0,0 +1,43 @@
+{{/*
+PrometheusAdapter custom metrics configuration (plan §14.4)
+Auto-rendered when hpa.enabled=true to configure prometheus-adapter for Miroir metrics.
+This ConfigMap is consumed by the prometheus-adapter Helm chart.
+*/}}
+{{- if and .Values.miroir.replicas .Values.miroir.hpa.enabled }}
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: {{ include "miroir.fullname" . }}-prometheus-adapter-metrics
+  labels:
+    {{- include "miroir.labels" . | nindent 4 }}
+    app.kubernetes.io/component: prometheus-adapter
+  annotations:
+    helm.sh/hook: pre-install,pre-upgrade
+    helm.sh/hook-weight: "-5"
+data:
+  # Custom metrics for Miroir HPA (plan §14.4)
+  # Per-pod metric: miroir_requests_in_flight
+  # Type: Pods (average value across all pods)
+  rules.yaml: |
+    - seriesQuery: '{__name__="miroir_requests_in_flight",namespace="{{ .Release.Namespace }}"}'
+      name:
+        as: "miroir_requests_in_flight"
+      metricsQuery: |
+        sum(miroir_requests_in_flight{<<.LabelMatchers>>}) by (<<.GroupBy>>)
+      resource:
+        name: miroir_requests_in_flight
+      container: miroir
+      type:
+        type: Pods
+    # Global metric: miroir_background_queue_depth
+    # Type: Value (not averaged, global cluster-wide metric)
+    - seriesQuery: '{__name__="miroir_background_queue_depth",namespace="{{ .Release.Namespace }}"}'
+      name:
+        as: "miroir_background_queue_depth"
+      metricsQuery: |
+        sum(miroir_background_queue_depth{<<.LabelMatchers>>})
+      resource:
+        name: miroir_background_queue_depth
+      type:
+        type: Value
+{{- end }}
--- a/charts/miroir/values.schema.json
+++ b/charts/miroir/values.schema.json
@ -63,8 +63,11 @@
            "enabled": {"type": "boolean"},
            "minReplicas": {"type": "integer", "minimum": 1},
            "maxReplicas": {"type": "integer", "minimum": 1},
+            "behavior": {"type": "object"},
            "targetCPUUtilizationPercentage": {"type": "integer", "minimum": 1, "maximum": 100},
-            "targetMemoryUtilizationPercentage": {"type": "integer", "minimum": 1, "maximum": 100}
+            "targetMemoryUtilizationPercentage": {"type": "integer", "minimum": 1, "maximum": 100},
+            "targetRequestsInFlight": {"type": "string"},
+            "targetBackgroundQueueDepth": {"type": "string"}
          }
        },
        "ingress": {
--- a/charts/miroir/values.yaml
+++ b/charts/miroir/values.yaml
@ -30,13 +30,31 @@ miroir:
  scatter:
    unavailableShardPolicy: partial  # partial | error

-  # Horizontal Pod Autoscaler
+  # Horizontal Pod Autoscaler (plan §14.4)
  hpa:
    enabled: false  # dev default; production: true (requires taskStore.backend=redis)
-    minReplicas: 2
-    maxReplicas: 10
+    # Per-workload-tier defaults (plan §14.7):
+    #   ≤ 500 QPS:   min=2, max=3
+    #   ≤ 2k QPS:    min=2, max=4
+    #   ≤ 5k QPS:    min=4, max=8  (default)
+    #   ≤ 20k QPS:   min=8, max=12
+    #   ≤ 100k QPS:  min=12, max=24
+    minReplicas: 4
+    maxReplicas: 8
+    # Stabilization windows (plan §14.4): scale-up fast, scale-down slow
+    behavior:
+      scaleDown:
+        stabilizationWindowSeconds: 300
+      scaleUp:
+        stabilizationWindowSeconds: 30
+    # Resource metrics (plan §14.4)
    targetCPUUtilizationPercentage: 70
-    targetMemoryUtilizationPercentage: 80
+    targetMemoryUtilizationPercentage: 75
+    # Custom metrics (require prometheus-adapter)
+    # Per-pod metric: average requests per pod
+    targetRequestsInFlight: 500
+    # Global metric: total background jobs queued across all pods
+    targetBackgroundQueueDepth: 10

  # Ingress configuration
  ingress: