Skip to content

Commit

Permalink
fix: helm release prioritize upgrade failed over reconcile progressing
Browse files Browse the repository at this point in the history
  • Loading branch information
adityathebe committed Jun 25, 2024
1 parent 0780ab0 commit f05a1c3
Show file tree
Hide file tree
Showing 4 changed files with 94 additions and 0 deletions.
1 change: 1 addition & 0 deletions pkg/health/health.go
Original file line number Diff line number Diff line change
Expand Up @@ -49,6 +49,7 @@ const (
HealthStatusRestart HealthStatusCode = "Restarting"
HealthStatusStarting HealthStatusCode = "Starting"
HealthStatusUnschedulable HealthStatusCode = "Unschedulable"
HealthStatusUpgradeFailed HealthStatusCode = "UpgradeFailed"

HealthStatusScalingUp HealthStatusCode = "Scaling Up"
HealthStatusScaledToZero HealthStatusCode = "Scaled to Zero"
Expand Down
5 changes: 5 additions & 0 deletions pkg/health/health_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -202,8 +202,13 @@ func TestFluxResources(t *testing.T) {
assertAppHealth(t, "./testdata/flux-kustomization-failed.yaml", "BuildFailed", health.HealthUnhealthy, false)
status := getHealthStatus("./testdata/flux-kustomization-failed.yaml", t)
assert.Contains(t, status.Message, "err='accumulating resources from 'kubernetes_resource_ingress_fail.yaml'")

assertAppHealth(t, "./testdata/flux-helmrelease-healthy.yaml", "ReconciliationSucceeded", health.HealthHealthy, true)
assertAppHealth(t, "./testdata/flux-helmrelease-unhealthy.yaml", "UpgradeFailed", health.HealthUnhealthy, false)
assertAppHealth(t, "./testdata/flux-helmrelease-upgradefailed.yaml", "UpgradeFailed", health.HealthUnhealthy, false)
helmreleaseStatus := getHealthStatus("./testdata/flux-helmrelease-upgradefailed.yaml", t)
assert.Contains(t, helmreleaseStatus.Message, "Helm upgrade failed for release mission-control-agent/prod-kubernetes-bundle with chart [email protected]: YAML parse error on mission-control-kubernetes/templates/topology.yaml: error converting YAML to JSON: yaml: line 171: did not find expected '-' indicator")
assert.Equal(t, helmreleaseStatus.Status, health.HealthStatusUpgradeFailed)

assertAppHealth(t, "./testdata/flux-helmrepository-healthy.yaml", "Succeeded", health.HealthHealthy, true)
assertAppHealth(t, "./testdata/flux-helmrepository-unhealthy.yaml", "Failed", health.HealthUnhealthy, false)
Expand Down
4 changes: 4 additions & 0 deletions pkg/health/statusMap.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -121,6 +121,10 @@ HelmRelease: &flux
ready: true
health: healthy
message: true
reasons:
UpgradeFailed:
health: unhealthy
order: 1
onUnknown:
status: Reconciling
nonReady: true
Expand Down
84 changes: 84 additions & 0 deletions pkg/health/testdata/flux-helmrelease-upgradefailed.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,84 @@
apiVersion: helm.toolkit.fluxcd.io/v2beta1
kind: HelmRelease
metadata:
annotations:
meta.helm.sh/release-name: netflix
meta.helm.sh/release-namespace: netflix
creationTimestamp: "2023-09-11T12:35:35Z"
finalizers:
- finalizers.fluxcd.io
generation: 2
labels:
app.kubernetes.io/instance: netflix
app.kubernetes.io/managed-by: Helm
app.kubernetes.io/name: mission-control-tenant
app.kubernetes.io/version: 1.0.26
helm.sh/chart: mission-control-tenant-1.0.26
helm.toolkit.fluxcd.io/name: netflix
helm.toolkit.fluxcd.io/namespace: netflix
name: netflix-mission-control-tenant
namespace: netflix
resourceVersion: "156985353"
uid: 7568b4fe-e5b3-442d-abdb-1f1f7bdb8e0c
spec:
chart:
spec:
chart: mission-control
interval: 1m
reconcileStrategy: ChartVersion
sourceRef:
kind: HelmRepository
name: netflix-mission-control-tenant
version: '>=0.0.0'
install:
crds: CreateReplace
createNamespace: true
interval: 5m
kubeConfig:
secretRef:
key: config
name: vc-netflix
storageNamespace: default
targetNamespace: default
upgrade:
crds: CreateReplace
values:
authProvider: clerk
clerkJWKSURL: https://secure-eagle-96.clerk.accounts.dev/.well-known/jwks.json
clerkOrgID: org_2VFcRC1Y4JSIUSoDfGUt8X2GZxd
db:
create: false
flanksource-ui:
enabled: false
kratos:
enabled: false
status:
conditions:
- lastTransitionTime: "2023-09-11T14:12:06Z"
type: Reconciling
reason: Progressing
status: "True"
message: Running 'upgrade' action with timeout of 5m0s
- lastTransitionTime: "2023-09-11T14:12:06Z"
type: Ready
reason: UpgradeFailed
status: "False"
message: "Helm upgrade failed for release
mission-control-agent/prod-kubernetes-bundle with chart
[email protected]: YAML parse error on
mission-control-kubernetes/templates/topology.yaml: error converting
YAML to JSON: yaml: line 171: did not find expected '-' indicator"
- lastTransitionTime: "2023-09-11T14:12:06Z"
type: Released
reason: UpgradeFailed
status: "False"
message: "Helm upgrade failed for release
mission-control-agent/prod-kubernetes-bundle with chart
[email protected]: YAML parse error on
mission-control-kubernetes/templates/topology.yaml: error converting
YAML to JSON: yaml: line 171: did not find expected '-' indicator"
storageNamespace: mission-control-agent
lastAttemptedRevision: 0.1.29
lastAttemptedGeneration: 1
lastAttemptedConfigDigest: sha256:e6dfc2b4a98058b60adc4fb33ed42d5e80f88471a4f9eb3e272709bf69417a32
lastAttemptedReleaseAction: upgrade

0 comments on commit f05a1c3

Please sign in to comment.