etcd StatefulSet YAML
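Three objects: a headless Service for stable per-pod DNS, a client-facing Service, and a StatefulSet whose startup and preStop scripts manage etcd membership (bootstrap, scale-up, scale-down, and re-join after failure).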
apiVersion: v1
kind: Service
metadata:
  name: "etcd"
  annotations:
    # Create endpoints also if the related pod isn't ready
    service.alpha.kubernetes.io/tolerate-unready-endpoints: "true"
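    # (this alpha annotation is deprecated; on current Kubernetes the
    # equivalent spec field is `publishNotReadyAddresses: true`)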
spec:
  ports:
  - port: 2379
    name: client
  - port: 2380
    name: peer
  clusterIP: None
  selector:
    component: "etcd"
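# clusterIP: None makes this a headless Service: each StatefulSet pod gets a
# stable DNS name of the form <pod>.<service> (e.g. etcd-0.etcd), which the
# scripts below use to build peer and client URLs.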
---
apiVersion: v1
kind: Service
metadata:
  name: etcd-client
spec:
  ports:
  - port: 2379
    name: client
  - port: 2380
    name: peer
  clusterIP: ""
  selector:
    component: "etcd"
---
apiVersion: apps/v1
kind: StatefulSet
metadata:
  name: "etcd"
  labels:
    component: "etcd"
spec:
  serviceName: "etcd"
  # changing replicas value will require a manual etcdctl member remove/add
  # command (remove before decreasing and add after increasing)
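  # for example (member ID is illustrative):
  #   etcdctl member remove 8e9e05c52164694d              # before scaling down
  #   etcdctl member add etcd-3 http://etcd-3.etcd:2380   # after scaling up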
  replicas: 3
  # updateStrategy:
  #   type: "RollingUpdate"
  #   rollingUpdate:
  #     partition: 3
  selector:
    matchLabels:
      component: "etcd"
  template:
    metadata:
      name: "etcd"
      labels:
        component: "etcd"
    spec:
      containers:
      - name: "etcd"
        image: "quay.io/coreos/etcd:v3.3"
        ports:
        - containerPort: 2379
          name: client
        - containerPort: 2380
          name: peer
        env:
        # When scaling the etcd cluster up or down, the INITIAL_CLUSTER_SIZE
        # would be the current size of the cluster and the CLUSTER_SIZE would
        # be the intended size of the cluster after scaling.
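        # Example scale-up from 3 to 5 members: set INITIAL_CLUSTER_SIZE=3,
        # CLUSTER_SIZE=5, and replicas: 5; the new pods etcd-3 and etcd-4 then
        # take the "member add" path in the startup script below.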
        - name: INITIAL_CLUSTER_SIZE
          value: "3"
        - name: CLUSTER_SIZE
          value: "3"
        - name: SET_NAME
          value: "etcd"
        volumeMounts:
        - name: data
          mountPath: /var/run/etcd
        lifecycle:
          preStop:
            exec:
              command:
              - "/bin/sh"
              - "-ec"
              - |
                EPS=""
                for i in $(seq 0 $((${INITIAL_CLUSTER_SIZE} - 1))); do
                    EPS="${EPS}${EPS:+,}http://${SET_NAME}-${i}.${SET_NAME}:2379"
                done
                HOSTNAME=$(hostname)
                member_hash() {
                    etcdctl member list | grep http://${HOSTNAME}.${SET_NAME}:2380 | cut -d':' -f1 | cut -d'[' -f1
                }
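                # "etcdctl member list" (v2 API) prints lines like the
                # following (ID illustrative):
                #   8e9e05c52164694d: name=etcd-0 peerURLs=http://etcd-0.etcd:2380 ...
                # the second cut strips the "[unstarted]" suffix shown for
                # members that were added but have not started yet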
                SET_ID=${HOSTNAME##*[^0-9]}
                if [ "${CLUSTER_SIZE}" -lt "${INITIAL_CLUSTER_SIZE}" ]; then
                    echo "Removing ${HOSTNAME} from etcd cluster"
                    ETCDCTL_ENDPOINT=${EPS} etcdctl member remove $(member_hash)
                    if [ $? -eq 0 ]; then
                        # Remove everything otherwise the cluster will no longer scale-up
                        rm -rf /var/run/etcd/*
                    fi
                fi
        command:
        - "/bin/sh"
        - "-ecx"
        - |
          HOSTNAME=$(hostname)
          # store member id into PVC for later member replacement
          collect_member() {
              while ! etcdctl member list >/dev/null 2>&1; do sleep 1; done
              etcdctl member list | grep http://${HOSTNAME}.${SET_NAME}:2380 | cut -d':' -f1 | cut -d'[' -f1 > /var/run/etcd/member_id
              exit 0
          }
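          # the member_id persisted above is read back by the re-join branch
          # below, which runs "etcdctl member update" instead of a fresh
          # "member add"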
          eps() {
              EPS=""
              for i in $(seq 0 $((${INITIAL_CLUSTER_SIZE} - 1))); do
                  EPS="${EPS}${EPS:+,}http://${SET_NAME}-${i}.${SET_NAME}:2379"
              done
              echo ${EPS}
          }
          member_hash() {
              etcdctl member list | grep http://${HOSTNAME}.${SET_NAME}:2380 | cut -d':' -f1 | cut -d'[' -f1
          }
          # we should wait for other pods to be up before trying to join,
          # otherwise we get "no such host" errors when trying to resolve other members
          SET_ID=${HOSTNAME##*[^0-9]}
          for i in $(seq 0 $((${SET_ID}))); do
              while true; do
                  echo "Waiting for ${SET_NAME}-${i}.${SET_NAME} to come up"
                  ping -W 1 -c 1 ${SET_NAME}-${i}.${SET_NAME} > /dev/null && break
                  sleep 1s
              done
          done
          # re-joining after failure?
          if [ -e /var/run/etcd/default.etcd ]; then
              echo "Re-joining etcd member"
              member_id=$(cat /var/run/etcd/member_id)
              # re-join member
              ETCDCTL_ENDPOINT=$(eps) etcdctl member update ${member_id} http://${HOSTNAME}.${SET_NAME}:2380 | true
              exec etcd --name ${HOSTNAME} \
                  --listen-peer-urls http://0.0.0.0:2380 \
                  --listen-client-urls http://0.0.0.0:2379 \
                  --advertise-client-urls http://${HOSTNAME}.${SET_NAME}:2379 \
                  --data-dir /var/run/etcd/default.etcd
          fi
          # etcd-SET_ID
          SET_ID=${HOSTNAME##*[^0-9]}
          # adding a new member to existing cluster (assuming all initial pods are available)
          if [ "${SET_ID}" -ge ${INITIAL_CLUSTER_SIZE} ]; then
              export ETCDCTL_ENDPOINT=$(eps)
              # member already added?
              MEMBER_HASH=$(member_hash)
              if [ -n "${MEMBER_HASH}" ]; then
                  # the member hash exists but for some reason etcd failed;
                  # as the data dir has not been created, we can remove the
                  # member and retrieve a new hash
                  etcdctl member remove ${MEMBER_HASH}
              fi
              echo "Adding new member"
              etcdctl member add ${HOSTNAME} http://${HOSTNAME}.${SET_NAME}:2380 | grep "^ETCD_" > /var/run/etcd/new_member_envs
              if [ $? -ne 0 ]; then
                  echo "Exiting"
                  rm -f /var/run/etcd/new_member_envs
                  exit 1
              fi
              cat /var/run/etcd/new_member_envs
              . /var/run/etcd/new_member_envs
              collect_member &
              exec etcd --name ${HOSTNAME} \
                  --listen-peer-urls http://0.0.0.0:2380 \
                  --listen-client-urls http://0.0.0.0:2379 \
                  --advertise-client-urls http://${HOSTNAME}.${SET_NAME}:2379 \
                  --data-dir /var/run/etcd/default.etcd \
                  --initial-advertise-peer-urls http://${HOSTNAME}.${SET_NAME}:2380 \
                  --initial-cluster ${ETCD_INITIAL_CLUSTER} \
                  --initial-cluster-state ${ETCD_INITIAL_CLUSTER_STATE}
          fi
          PEERS=""
          for i in $(seq 0 $((${INITIAL_CLUSTER_SIZE} - 1))); do
              PEERS="${PEERS}${PEERS:+,}${SET_NAME}-${i}=http://${SET_NAME}-${i}.${SET_NAME}:2380"
          done
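          # PEERS ends up as, e.g.:
          #   etcd-0=http://etcd-0.etcd:2380,etcd-1=http://etcd-1.etcd:2380,etcd-2=http://etcd-2.etcd:2380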
          collect_member &
          # join member
          exec etcd --name ${HOSTNAME} \
              --initial-advertise-peer-urls http://${HOSTNAME}.${SET_NAME}:2380 \
              --listen-peer-urls http://0.0.0.0:2380 \
              --listen-client-urls http://0.0.0.0:2379 \
              --advertise-client-urls http://${HOSTNAME}.${SET_NAME}:2379 \
              --initial-cluster-token etcd-cluster-1 \
              --initial-cluster ${PEERS} \
              --initial-cluster-state new \
              --data-dir /var/run/etcd/default.etcd
  ## We are using dynamic PV provisioning with the "standard" storage class,
  ## so this resource can be deployed on minikube without changes (minikube
  ## defines this class for its hostpath provisioner). In production, define
  ## your own way to use PV claims.
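  ## To pin a specific class, set `storageClassName` in the claim spec below.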
  volumeClaimTemplates:
  - metadata:
      name: data
    spec:
      accessModes:
      - "ReadWriteOnce"
      resources:
        requests:
          storage: 1Gi
---