Skip to content

Commit

Permalink
[CRDB-44997] feature: support WAL failover
Browse files Browse the repository at this point in the history
Adds support for WAL failover via:
- among multiple stores
- single store side disk (as a PVC)
  • Loading branch information
pritesh-lahoti committed Dec 18, 2024
1 parent e4ea4de commit 28168fd
Show file tree
Hide file tree
Showing 7 changed files with 638 additions and 38 deletions.
41 changes: 41 additions & 0 deletions build/templates/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -175,19 +175,60 @@ conf:
http-port: ""

# CockroachDB's data mount path.
# For multi-store configuration, the path for each store is evaluated as:
# Store 1: cockroach-data
# Store 2: cockroach-data-2
# Store N: cockroach-data-N
path: cockroach-data

# CockroachDB's storage configuration https://www.cockroachlabs.com/docs/v21.1/cockroach-start.html#storage
# Uses --store flag
store:
enabled: false
# Number of data stores per node.
# For multi-store configuration, set this to a value greater than 1.
count: 1
# Should be empty or 'mem'
type:
# Required for type=mem. If type and size are both empty, storage.persistentVolume.size is used
size:
# Arbitrary strings, separated by colons, specifying disk type or capability
attrs:

# CockroachDB's WAL failover configuration:
# https://www.cockroachlabs.com/docs/stable/cockroach-start#write-ahead-log-wal-failover
# Uses `--wal-failover` flag
wal-failover:
# The value to be passed to the `--wal-failover` flag.
# Possible configurations:
# 1. ``: If empty, `--wal-failover` is not passed to cockroach start.
# 2. `disabled`: Disables WAL failover.
# 3. `among-stores`: Enables WAL failover among multiple stores. This requires
# `conf.store.count` to be greater than 1.
# 4. `path=<path-to-side-disk>`: Enables WAL failover to a side disk. This requires
# a persistent volume to be mounted at this path (e.g. `path=/cockroach/cockroach-failover`).
value:

persistentVolume:
# If enabled, then a PersistentVolumeClaim will be created and
# used for WAL failover as a side disk.
# https://www.cockroachlabs.com/docs/v24.3/wal-failover#provision-a-single-store-cluster-and-side-disk-for-wal-failover
enabled: false
# Mount path for the side disk. This gets prepended with `/cockroach/` in the stateful set.
path: cockroach-failover
size: 25Gi
# If defined, then `storageClassName: <storageClass>`.
# If set to "-", then `storageClassName: ""`, which disables dynamic
# provisioning.
# If undefined or empty (default), then no `storageClassName` spec is
# set, so the default provisioner will be chosen (gp2 on AWS, standard
# on GKE, AWS & OpenStack).
storageClass: ""
# Additional labels to apply to the created PersistentVolumeClaims.
labels: {}
# Additional annotations to apply to the created PersistentVolumeClaims.
annotations: {}

statefulset:
replicas: 3
updateStrategy:
Expand Down
63 changes: 55 additions & 8 deletions cockroachdb/templates/_helpers.tpl
Original file line number Diff line number Diff line change
Expand Up @@ -85,16 +85,20 @@ Return the appropriate apiVersion for StatefulSets
Return CockroachDB store expression
*/}}
{{- define "cockroachdb.conf.store" -}}
{{- $isInMemory := eq (.Values.conf.store.type | toString) "mem" -}}
{{- $persistentSize := empty .Values.conf.store.size | ternary .Values.storage.persistentVolume.size .Values.conf.store.size -}}
{{- $isInMemory := eq (.Values.conf.store.type | toString) "mem" -}}
{{- $persistentSize := empty .Values.conf.store.size | ternary .Values.storage.persistentVolume.size .Values.conf.store.size -}}

{{- $store := dict -}}
{{- $_ := set $store "type" ($isInMemory | ternary "type=mem" "") -}}
{{- $_ := set $store "path" ($isInMemory | ternary "" (print "path=" .Values.conf.path)) -}}
{{- $_ := set $store "size" (print "size=" ($isInMemory | ternary .Values.conf.store.size $persistentSize)) -}}
{{- $_ := set $store "attrs" (empty .Values.conf.store.attrs | ternary "" (print "attrs=" .Values.conf.store.attrs)) -}}
{{- $store := dict -}}
{{- $_ := set $store "type" ($isInMemory | ternary "type=mem" "") -}}
{{- if eq .Args.idx 0 -}}
{{- $_ := set $store "path" ($isInMemory | ternary "" (print "path=" .Values.conf.path)) -}}
{{- else -}}
{{- $_ := set $store "path" ($isInMemory | ternary "" (print "path=" .Values.conf.path "-" (add1 .Args.idx))) -}}
{{- end -}}
{{- $_ := set $store "size" (print "size=" ($isInMemory | ternary .Values.conf.store.size $persistentSize)) -}}
{{- $_ := set $store "attrs" (empty .Values.conf.store.attrs | ternary "" (print "attrs=" .Values.conf.store.attrs)) -}}

{{ compact (values $store) | join "," }}
{{- compact (values $store) | sortAlpha | join "," -}}
{{- end -}}

{{/*
Expand Down Expand Up @@ -303,3 +307,46 @@ Validate the log configuration.
{{- end -}}
{{- end -}}
{{- end -}}

{{/*
Return the quoted hostPath for an additional store.

Reads the zero-based store index from `.Args.idx` and appends `-<idx+1>` to
`.Values.storage.hostPath`. A trailing slash on the configured hostPath is
kept on the result (e.g. `/mnt/data/` with idx 1 becomes `"/mnt/data-2/"`).
*/}}
{{- define "cockroachdb.storage.hostPath.computation" -}}
  {{- $hostPath := .Values.storage.hostPath -}}
  {{- $storeNumber := add1 .Args.idx -}}
  {{- if hasSuffix "/" $hostPath -}}
    {{- /* `dir` drops the trailing slash so the suffix lands on the directory name. */ -}}
    {{- printf "%s-%d/" (dir $hostPath) $storeNumber | quote -}}
  {{- else -}}
    {{- printf "%s-%d" $hostPath $storeNumber | quote -}}
  {{- end -}}
{{- end -}}

{{/*
Validate the store count configuration.

Fails rendering when `conf.store.count` is not 1 while `conf.store.enabled`
is false, or when it is lower than 1 while `conf.store.enabled` is true.
*/}}
{{- define "cockroachdb.conf.store.validation" -}}
  {{- $count := int .Values.conf.store.count -}}
  {{- if and (not .Values.conf.store.enabled) (ne $count 1) -}}
    {{ fail "Store count should be 1 when disabled" }}
  {{- end -}}
  {{- /* The StatefulSet derives its data volumes and mounts from the count, so it must be at least 1. */ -}}
  {{- if and .Values.conf.store.enabled (lt $count 1) -}}
    {{ fail "Store count should be at least 1 when enabled" }}
  {{- end -}}
{{- end -}}

{{/*
Validate the WAL failover configuration.

Fails rendering when `conf.wal-failover.value`:
  - is not one of '', 'disabled', 'among-stores' or 'path=<path>';
  - is 'among-stores' while `conf.store.enabled` is false or
    `conf.store.count` is lower than 2;
  - is 'path=<path>' while `conf.wal-failover.persistentVolume.enabled` is
    false, or while <path> starts with neither
    `/cockroach/<persistentVolume.path>` nor `<persistentVolume.path>`.
*/}}
{{- define "cockroachdb.conf.wal-failover.validation" -}}
  {{- with index .Values.conf `wal-failover` -}}
    {{- /* Normalise once so an unset or non-string value cannot break the string comparisons below. */ -}}
    {{- $value := .value | default "" | toString -}}
    {{- $isSideDisk := hasPrefix "path=" $value -}}
    {{- if not (mustHas $value (list "" "disabled" "among-stores")) -}}
      {{- if not $isSideDisk -}}
        {{ fail "Invalid WAL failover configuration value. Expected either of '', 'disabled', 'among-stores' or 'path=<path>'" }}
      {{- end -}}
    {{- end -}}
    {{- if eq $value "among-stores" -}}
      {{- /* "Greater than 1" must also reject zero and negative counts, not just exactly 1. */ -}}
      {{- if or (not $.Values.conf.store.enabled) (lt (int $.Values.conf.store.count) 2) -}}
        {{ fail "WAL failover among stores requires store enabled with count greater than 1" }}
      {{- end -}}
    {{- end -}}
    {{- if $isSideDisk -}}
      {{- if not .persistentVolume.enabled -}}
        {{ fail "WAL failover to a side disk requires a persistent volume" }}
      {{- end -}}
      {{- $sideDiskPath := trimPrefix "path=" $value -}}
      {{- /* Accept both the absolute mount path and the path relative to `/cockroach/`. */ -}}
      {{- if and (not (hasPrefix (printf "/cockroach/%s" .persistentVolume.path) $sideDiskPath)) (not (hasPrefix .persistentVolume.path $sideDiskPath)) -}}
        {{ fail "WAL failover to a side disk requires a path to the mounted persistent volume" }}
      {{- end -}}
    {{- end -}}
  {{- end -}}
{{- end -}}
114 changes: 99 additions & 15 deletions cockroachdb/templates/statefulset.yaml
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
{{ template "cockroachdb.conf.log.validation" . }}
{{ template "cockroachdb.conf.store.validation" . }}
kind: StatefulSet
apiVersion: {{ template "cockroachdb.statefulset.apiVersion" . }}
metadata:
Expand Down Expand Up @@ -235,7 +236,14 @@ spec:
--sql-audit-dir={{ . }}
{{- end }}
{{- if .Values.conf.store.enabled }}
--store={{ template "cockroachdb.conf.store" . }}
{{- range $idx := until (int .Values.conf.store.count) }}
{{- $_ := set $ "Args" (dict "idx" $idx) }}
--store={{ include "cockroachdb.conf.store" $ }}
{{- end }}
{{- end }}
{{- with index .Values.conf `wal-failover` `value` }}
{{- template "cockroachdb.conf.wal-failover.validation" $ }}
--wal-failover={{ . }}
{{- end }}
{{- if .Values.conf.log.enabled }}
--log-config-file=/cockroach/log-config/log-config.yaml
Expand Down Expand Up @@ -271,8 +279,21 @@ spec:
{{- end }}
protocol: TCP
volumeMounts:
{{- range $i := until (int .Values.conf.store.count) }}
{{- if eq $i 0 }}
- name: datadir
mountPath: /cockroach/{{ .Values.conf.path }}/
mountPath: /cockroach/{{ $.Values.conf.path }}/
{{- else }}
- name: datadir-{{ add1 $i }}
mountPath: /cockroach/{{ $.Values.conf.path }}-{{ add1 $i }}/
{{- end }}
{{- end }}
{{- with index .Values.conf `wal-failover` `persistentVolume` }}
{{- if .enabled }}
- name: failoverdir
mountPath: /cockroach/{{ .path }}/
{{- end }}
{{- end }}
{{- if .Values.tls.enabled }}
- name: certs
mountPath: /cockroach/cockroach-certs/
Expand Down Expand Up @@ -344,16 +365,43 @@ spec:
resources: {{- toYaml . | nindent 12 }}
{{- end }}
volumes:
{{- range $i := until (int .Values.conf.store.count) }}
{{- if eq $i 0 }}
- name: datadir
{{- if .Values.storage.persistentVolume.enabled }}
{{- if $.Values.storage.persistentVolume.enabled }}
persistentVolumeClaim:
claimName: datadir
{{- else if .Values.storage.hostPath }}
{{- else if $.Values.storage.hostPath }}
hostPath:
path: {{ $.Values.storage.hostPath | quote }}
{{- else }}
emptyDir: {}
{{- end }}
{{- else }}
- name: datadir-{{ add1 $i }}
{{- if $.Values.storage.persistentVolume.enabled }}
persistentVolumeClaim:
claimName: datadir-{{ add1 $i }}
{{- else if $.Values.storage.hostPath }}
{{- $_ := set $ "Args" (dict "idx" $i) }}
hostPath:
path: {{ .Values.storage.hostPath | quote }}
path: {{ include "cockroachdb.storage.hostPath.computation" $ }}
{{- else }}
emptyDir: {}
{{- end }}
{{- end }}
{{- end }}
{{- with index .Values.conf `wal-failover` }}
{{- if .value }}
- name: failoverdir
{{- if .persistentVolume.enabled }}
persistentVolumeClaim:
claimName: failoverdir
{{- else }}
emptyDir: {}
{{- end }}
{{- end }}
{{- end }}
{{- with .Values.statefulset.volumes }}
{{ toYaml . | nindent 8 }}
{{- end }}
Expand Down Expand Up @@ -418,35 +466,71 @@ spec:
runAsNonRoot: true
{{- end }}
{{- end }}
{{- if or .Values.storage.persistentVolume.enabled .Values.conf.log.persistentVolume.enabled }}
{{- if or .Values.storage.persistentVolume.enabled (index .Values.conf `wal-failover` `persistentVolume` `enabled`) .Values.conf.log.persistentVolume.enabled }}
volumeClaimTemplates:
{{- if .Values.storage.persistentVolume.enabled }}
{{- range $i := until (int .Values.conf.store.count) }}
- metadata:
{{- if eq $i 0 }}
name: datadir
{{- else }}
name: datadir-{{ add1 $i }}
{{- end }}
labels:
app.kubernetes.io/name: {{ template "cockroachdb.name" . }}
app.kubernetes.io/instance: {{ .Release.Name | quote }}
{{- with .Values.storage.persistentVolume.labels }}
app.kubernetes.io/name: {{ template "cockroachdb.name" $ }}
app.kubernetes.io/instance: {{ $.Release.Name | quote }}
{{- with $.Values.storage.persistentVolume.labels }}
{{- toYaml . | nindent 10 }}
{{- end }}
{{- with .Values.labels }}
{{- with $.Values.labels }}
{{- toYaml . | nindent 10 }}
{{- end }}
{{- with $.Values.storage.persistentVolume.annotations }}
annotations: {{- toYaml . | nindent 10 }}
{{- end }}
spec:
accessModes: ["ReadWriteOnce"]
{{- if $.Values.storage.persistentVolume.storageClass }}
{{- if (eq "-" $.Values.storage.persistentVolume.storageClass) }}
storageClassName: ""
{{- else }}
storageClassName: {{ $.Values.storage.persistentVolume.storageClass | quote}}
{{- end }}
{{- end }}
resources:
requests:
storage: {{ $.Values.storage.persistentVolume.size | quote }}
{{- end }}
{{- end }}
{{- with index .Values.conf `wal-failover` }}
{{- if .persistentVolume.enabled }}
- metadata:
name: failoverdir
labels:
app.kubernetes.io/name: {{ template "cockroachdb.name" $ }}
app.kubernetes.io/instance: {{ $.Release.Name | quote }}
{{- with .persistentVolume.labels }}
{{- toYaml . | nindent 10 }}
{{- end }}
{{- with .Values.storage.persistentVolume.annotations }}
{{- with $.Values.labels }}
{{- toYaml . | nindent 10 }}
{{- end }}
{{- with .persistentVolume.annotations }}
annotations: {{- toYaml . | nindent 10 }}
{{- end }}
spec:
accessModes: ["ReadWriteOnce"]
{{- if .Values.storage.persistentVolume.storageClass }}
{{- if (eq "-" .Values.storage.persistentVolume.storageClass) }}
{{- with .persistentVolume.storageClass }}
{{- if eq "-" . }}
storageClassName: ""
{{- else }}
storageClassName: {{ .Values.storage.persistentVolume.storageClass | quote}}
storageClassName: {{ . | quote}}
{{- end }}
{{- end }}
resources:
requests:
storage: {{ .Values.storage.persistentVolume.size | quote }}
storage: {{ .persistentVolume.size | quote }}
{{- end }}
{{- end }}
{{- if .Values.conf.log.persistentVolume.enabled }}
- metadata:
Expand Down
41 changes: 41 additions & 0 deletions cockroachdb/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -176,19 +176,60 @@ conf:
http-port: ""

# CockroachDB's data mount path.
# For multi-store configuration, the path for each store is evaluated as:
# Store 1: cockroach-data
# Store 2: cockroach-data-2
# Store N: cockroach-data-N
path: cockroach-data

# CockroachDB's storage configuration https://www.cockroachlabs.com/docs/v21.1/cockroach-start.html#storage
# Uses --store flag
store:
enabled: false
# Number of data stores per node.
# For multi-store configuration, set this to a value greater than 1.
count: 1
# Should be empty or 'mem'
type:
# Required for type=mem. If type and size are both empty, storage.persistentVolume.size is used
size:
# Arbitrary strings, separated by colons, specifying disk type or capability
attrs:

# CockroachDB's WAL failover configuration:
# https://www.cockroachlabs.com/docs/stable/cockroach-start#write-ahead-log-wal-failover
# Uses `--wal-failover` flag
wal-failover:
# The value to be passed to the `--wal-failover` flag.
# Possible configurations:
# 1. ``: If empty, `--wal-failover` is not passed to cockroach start.
# 2. `disabled`: Disables WAL failover.
# 3. `among-stores`: Enables WAL failover among multiple stores. This requires
# `conf.store.count` to be greater than 1.
# 4. `path=<path-to-side-disk>`: Enables WAL failover to a side disk. This requires
# a persistent volume to be mounted at this path (e.g. `path=/cockroach/cockroach-failover`).
value:

persistentVolume:
# If enabled, then a PersistentVolumeClaim will be created and
# used for WAL failover as a side disk.
# https://www.cockroachlabs.com/docs/v24.3/wal-failover#provision-a-single-store-cluster-and-side-disk-for-wal-failover
enabled: false
# Mount path for the side disk. This gets prepended with `/cockroach/` in the stateful set.
path: cockroach-failover
size: 25Gi
# If defined, then `storageClassName: <storageClass>`.
# If set to "-", then `storageClassName: ""`, which disables dynamic
# provisioning.
# If undefined or empty (default), then no `storageClassName` spec is
# set, so the default provisioner will be chosen (gp2 on AWS, standard
# on GKE, AWS & OpenStack).
storageClass: ""
# Additional labels to apply to the created PersistentVolumeClaims.
labels: {}
# Additional annotations to apply to the created PersistentVolumeClaims.
annotations: {}

statefulset:
replicas: 3
updateStrategy:
Expand Down
Loading

0 comments on commit 28168fd

Please sign in to comment.