The AWS EKS team works extremely hard. We appreciate all of their effort.
But the `aws-vpc-cni` requires fine-tuning of complex settings, and:
- Limits the number of pods you can run on an EC2 instance, based on the number of ENIs that instance size (or type) can support. Pod density is valuable.
- Requires you to play with settings like `WARM_ENI_TARGET`, `WARM_IP_TARGET`, `WARM_PREFIX_TARGET`, etc.
- Runs into conditions where Pods get stuck in "Creating," since IP management gets tricky based on cluster pod churn, and `aws-vpc-cni`'s `ENABLE_PREFIX_DELEGATION` + branching can lead to a lot of wasted IPs
If you've ever sat there and watched your cluster or pods "get stuck" because of a failure to assign an IP address, you know the pain of this.
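If you haven't had the pleasure: that tuning usually means setting environment variables on the `aws-node` DaemonSet. A minimal sketch (the values here are illustrative, not recommendations):

```bash
# Tune the aws-vpc-cni warm pool by setting env vars on the aws-node DaemonSet.
# Values are examples only; the "right" numbers depend on your pod churn.
kubectl -n kube-system set env daemonset/aws-node \
  WARM_ENI_TARGET=1 \
  WARM_IP_TARGET=5 \
  MINIMUM_IP_TARGET=10
```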
Cilium's `vxlan` overlay approach obviates these problems completely.
- Trade-off: You won't be able to use "Pod Security Groups" with this implementation
- Trade-off: Another downside of this approach is that you can no longer create Services of type `LoadBalancer` backed by an NLB in IP mode via the aws-load-balancer-controller. In other words, NLBs can no longer send traffic directly to your pods; they can only send traffic to instances listening on a NodePort. This means you can't use the controller's Pod readiness gates, and you can no longer guarantee 0-downtime deployments/upgrades of your ingress pods/nodes. If you're okay with a few dropped requests, then great. If not, think twice! --> thanks to /u/DPRegular
- Benefit: No more "stuck pods" or IP starvation, ever
- Benefit: No more pod density/max-pods limitations on your nodes - you can safely use t3/t4g micro, small, etc. with your autoscaler of choice. WE RECOMMEND KARPENTER!
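For reference, a vxlan-overlay install via cilium-cli looks roughly like this. This is a sketch, not this repo's exact invocation: the Helm value names below match ~1.12-era charts (newer releases renamed `tunnel` to `routingMode`/`tunnelProtocol`), and the pod CIDR is a placeholder.

```bash
# Sketch: overlay-mode install; verify value names against your Cilium release.
cilium install \
  --helm-set tunnel=vxlan \
  --helm-set ipam.mode=cluster-pool \
  --helm-set ipam.operator.clusterPoolIPv4PodCIDRList='192.168.0.0/16'
```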
Place `cilium-provisioner.tf`, `dynamic-cilium-values.tpl`, and `_cilium-provisioner.sh` in the same folder as your EKS terraform module.
You can also use `_cilium-provisioner.sh` + `dynamic-cilium-values.tpl` without terraform. Just read the instructions in the script, rename `dynamic-cilium-values.tpl` to `.yaml`, and hard-code your values.
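The terraform-less flow boils down to something like this (a sketch; the authoritative steps are the comments inside the script itself):

```bash
# Rename the template, hard-code your values, then run the script
# per its embedded instructions.
mv dynamic-cilium-values.tpl dynamic-cilium-values.yaml
# ...edit dynamic-cilium-values.yaml by hand...
bash ./_cilium-provisioner.sh
```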
Read this, and make sure you have all the necessary port/firewall configs in place: https://docs.cilium.io/en/v1.9/operations/system_requirements/#firewall-rules
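For the vxlan path specifically, the node-to-node rules from that page boil down to UDP 8472 (vxlan) and TCP 4240 (health checks). A sketch, with a placeholder security-group ID:

```bash
# Allow vxlan and cilium health-check traffic between worker nodes.
# sg-0123456789abcdef0 is a placeholder for your shared node SG.
aws ec2 authorize-security-group-ingress --group-id sg-0123456789abcdef0 \
  --protocol udp --port 8472 --source-group sg-0123456789abcdef0
aws ec2 authorize-security-group-ingress --group-id sg-0123456789abcdef0 \
  --protocol tcp --port 4240 --source-group sg-0123456789abcdef0
```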
This assumes:
- You're using the EKS module for terraform
- You're using Linux Kernel 5.15.x on your AL2/BottleRocket/Ubuntu nodes
- Your EKS `Service IPv4 range` --> `10.100.0.0/16`
- Your EKS cluster endpoint is accessible 🫠
- You're using the latest cilium-cli release
- Worker nodes are in private subnets, and have NAT gateways setup on the VPC
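A few quick ways to sanity-check those assumptions (cluster name is a placeholder):

```bash
# Service IPv4 range: expect 10.100.0.0/16
aws eks describe-cluster --name my-cluster \
  --query "cluster.kubernetesNetworkConfig.serviceIpv4Cidr" --output text
# Kernel version (run on a worker node): expect 5.15.x
uname -r
# cilium-cli version
cilium version
```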
For your nodegroups, you need to find some standard way to tag your EC2s (the installation script relies on this fact). This is because you have to flush IPTables on any existing/running nodes in your cluster that were using the default `aws-vpc-cni` plugin, after it is disabled and cilium is installed. The installation script retrieves those instance IDs by tag, automatically, and then flushes IPTables on those nodes using `aws ssm send-command`.
You'll probably want to modify/tweak this to fit your setup.
```bash
# Look up running "base" nodes by Name tag (adjust the pattern to your tagging scheme)
instance_ids=$(aws ec2 describe-instances \
  --filters "Name=tag:Name,Values=*${CLUSTER_NAME}-base-compute*" "Name=instance-state-name,Values=running" \
  --query "Reservations[].Instances[].InstanceId" \
  --output text)
```
In our case, we tag our "base" nodes (those which are not auto-scaled with `karpenter`) with this pattern: `nameOfCluster-base-compute-*` --> example EC2 name: `v3-qa-1-base-compute-1`
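If an existing node is missing the tag, applying it by hand is a one-liner (instance ID is a placeholder):

```bash
aws ec2 create-tags --resources i-0123456789abcdef0 \
  --tags Key=Name,Value=v3-qa-1-base-compute-1
```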
You will see on line 59 of the `_cilium-provisioner.sh` script that we use this tag to identify the existing nodes that we have just installed cilium on. This is an extremely important step. Don't skip it.
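The flush itself has roughly this shape. This is a sketch, not the script's exact payload; see the script for the real commands it sends:

```bash
# Flush the iptables state left behind by aws-vpc-cni on the tagged nodes.
# $instance_ids comes from the describe-instances query shown earlier.
aws ssm send-command \
  --instance-ids $instance_ids \
  --document-name "AWS-RunShellScript" \
  --parameters 'commands=["iptables -t nat -F","iptables -t mangle -F","iptables -F"]'
```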
At startup, all of your nodes will need to be tainted with:

```yaml
- key: node.cilium.io/agent-not-ready
  value: "true"
  effect: NoExecute
```
- READ Karpenter docs regarding taints: https://karpenter.sh/preview/concepts/provisioners/#cilium-startup-taint
- READ Cilium docs regarding taints: https://docs.cilium.io/en/stable/installation/taints/#considerations-on-node-pool-taints-and-unmanaged-pods
- Also see the "EKS" installation instructions tab here: https://docs.cilium.io/en/stable/installation/taints/#considerations-on-node-pool-taints-and-unmanaged-pods
- This particular configuration doesn't include L7 traffic shaping or loadbalancing
- This particular configuration doesn't rely on an egress gateway, although our testing showed that using cilium's egress gateway implementation also works (we tend to avoid any additional complexity wherever possible)
- This particular configuration is ready for use with cilium's magical cluster mesh networking
- This particular configuration does not rely on cilium's ingress gateway (we use aws-load-balancer-controller for that)
Make sure that:
- karpenter --> `hostNetwork: true`
- aws-load-balancer-controller --> `hostNetwork: true`
- metrics-server --> `hostNetwork.enabled: true`

...otherwise, they won't work.
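If you manage those with helm, the mapping looks something like this (chart sources/repo aliases are assumptions - adjust to however you install them):

```bash
# Value paths match the list above; chart locations are assumptions.
helm upgrade karpenter oci://public.ecr.aws/karpenter/karpenter \
  -n karpenter --reuse-values --set hostNetwork=true
helm upgrade aws-load-balancer-controller eks/aws-load-balancer-controller \
  -n kube-system --reuse-values --set hostNetwork=true
helm upgrade metrics-server metrics-server/metrics-server \
  -n kube-system --reuse-values --set hostNetwork.enabled=true
```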
We only install the following "EKS addons" generically:
- kube-proxy
- coreDNS
- aws-vpc-cni
We also install the following from their most recent helm charts, and not as addons, since "addon" versions gave us issues:
- aws-efs-csi-driver
- aws-ebs-csi-driver
- external-dns
- aws-load-balancer-controller
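In practice the split looks something like this (cluster/chart names illustrative):

```bash
# "Generic" EKS addon install
aws eks create-addon --cluster-name my-cluster --addon-name kube-proxy
# Helm chart instead of the addon version
helm repo add aws-ebs-csi-driver https://kubernetes-sigs.github.io/aws-ebs-csi-driver
helm upgrade --install aws-ebs-csi-driver aws-ebs-csi-driver/aws-ebs-csi-driver \
  -n kube-system
```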
To undo the changes made by cilium and completely uninstall it, just run:

```bash
cilium uninstall
```

This will restore the `aws-vpc-cni` plugin.
After removing cilium, you'll need to make sure you restart all your pods and/or revert any changes to your helm `values.yaml` for any of the aforementioned services. You'll definitely want to restart kube-proxy and coreDNS as well, as shown below.
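Restarting those two is just a rollout restart (standard kube-system resource names assumed):

```bash
kubectl -n kube-system rollout restart daemonset kube-proxy
kubectl -n kube-system rollout restart deployment coredns
```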