├── example ├── .gitignore ├── main.tf └── README.md ├── modules └── agent_group │ ├── outputs.tf │ ├── versions.tf │ ├── main.tf │ ├── variables.tf │ └── agent.tf ├── addons.tf ├── .pre-commit-config.yaml ├── versions.tf ├── CONTRIBUTING.md ├── ssh.tf ├── network.tf ├── main.tf ├── LICENSE ├── agents.tf ├── output.tf ├── kubeconfig.tf ├── manifests ├── hello-kubernetes.yaml ├── hcloud-ccm-net.yaml └── upgrade-controller.yaml ├── control_plane.tf ├── control_plane_primary.tf ├── .gitignore ├── upgrades.tf ├── variables.tf ├── logo.svg └── README.md /example/.gitignore: -------------------------------------------------------------------------------- 1 | .terraform 2 | .envrc 3 | kubeconfig* 4 | *.lock.hcl -------------------------------------------------------------------------------- /modules/agent_group/outputs.tf: -------------------------------------------------------------------------------- 1 | output "public_ips" { 2 | value = [for server in hcloud_server.agent : server.ipv4_address] 3 | } -------------------------------------------------------------------------------- /addons.tf: -------------------------------------------------------------------------------- 1 | data "http" "hcloud_csi_driver_manifest" { 2 | url = "https://raw.githubusercontent.com/hetznercloud/csi-driver/${var.hcloud_csi_driver_version}/deploy/kubernetes/hcloud-csi.yml" 3 | } 4 | 5 | -------------------------------------------------------------------------------- /modules/agent_group/versions.tf: -------------------------------------------------------------------------------- 1 | terraform { 2 | required_providers { 3 | hcloud = { 4 | source = "hetznercloud/hcloud" 5 | version = "~> 1.27" 6 | } 7 | } 8 | required_version = ">= 0.13" 9 | } 10 | -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- 1 | repos: 2 | - repo: https://github.com/antonbabenko/pre-commit-terraform 3 | rev: v1.50.0 4 | hooks: 5 | - id: terraform_fmt 6 | - id: terraform_validate 7 | - id: terraform_docs 8 | args: ['--args=--indent 3 --hide modules --hide providers --hide requirements --hide resources --hide data-sources'] -------------------------------------------------------------------------------- /modules/agent_group/main.tf: -------------------------------------------------------------------------------- 1 | data "hcloud_image" "ubuntu" { 2 | name = "ubuntu-20.04" 3 | } 4 | 5 | resource "random_pet" "agent_suffix" { 6 | count = var.server_count 7 | } 8 | 9 | locals { 10 | agent_pet_names = [for pet in random_pet.agent_suffix : pet.id] 11 | agent_name_map = { for i in range(0, var.server_count) : random_pet.agent_suffix[i].id => i } 12 | } 13 | -------------------------------------------------------------------------------- /versions.tf: -------------------------------------------------------------------------------- 1 | terraform { 2 | required_providers { 3 | hcloud = { 4 | source = "hetznercloud/hcloud" 5 | version = "~> 1.27" 6 | } 7 | kubectl = { 8 | source = "gavinbunney/kubectl" 9 | version = "~> 1.13" 10 | } 11 | remote = { 12 | source = "tenstad/remote" 13 | version = "~> 0.0.23" 14 | } 15 | } 16 | required_version = ">= 0.13" 17 | } 18 | 19 | provider "hcloud" { 20 | token = var.hcloud_token 21 | } 22 | -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- 1 | # 
Contribution Guide 2 | 3 | This guide describes necessary tools and processes to contribute to this project. 4 | 5 | ## Development Setup 6 | 7 | ### Required tools 8 | 9 | The following tools are necessary for working with this repository: 10 | 11 | - [terraform](https://www.terraform.io) (for obvious reasons) 12 | - [pre-commit](https://pre-commit.com/#install) (to run linter/docs) 13 | - this requires a python installation 14 | - [terraform-docs](https://terraform-docs.io/user-guide/installation/) (to create the inputs/outputs table) 15 | 16 | ### pre-commit 17 | 18 | Before you commit, run `pre-commit run -a`. 19 | 20 | You can also do that automatically before each commit with `pre-commit install`. 21 | 22 | -------------------------------------------------------------------------------- /ssh.tf: -------------------------------------------------------------------------------- 1 | resource "tls_private_key" "ssh" { 2 | count = var.ssh_private_key_location == null ? 1 : 0 3 | algorithm = "RSA" 4 | rsa_bits = 4096 5 | } 6 | 7 | data "local_file" "custom_ssh_private_key" { 8 | count = var.ssh_private_key_location == null ? 0 : 1 9 | filename = var.ssh_private_key_location 10 | } 11 | 12 | data "tls_public_key" "custom_ssh" { 13 | count = var.ssh_private_key_location == null ? 0 : 1 14 | private_key_pem = data.local_file.custom_ssh_private_key[0].content 15 | } 16 | 17 | locals { 18 | ssh_private_key = var.ssh_private_key_location != null ? data.local_file.custom_ssh_private_key[0].content : tls_private_key.ssh[0].private_key_pem 19 | ssh_public_key = var.ssh_private_key_location != null ? data.tls_public_key.custom_ssh[0].public_key_openssh : tls_private_key.ssh[0].public_key_openssh 20 | } -------------------------------------------------------------------------------- /network.tf: -------------------------------------------------------------------------------- 1 | resource "hcloud_network" "k3s" { 2 | count = var.network_id == null ? 1 : 0 3 | name = "${var.name}-k3s-network" 4 | ip_range = var.network_cidr 5 | labels = local.common_labels 6 | } 7 | 8 | data "hcloud_network" "k3s" { 9 | count = var.network_id == null ? 0 : 1 10 | id = var.network_id 11 | } 12 | 13 | locals { 14 | network_id = var.network_id == null ? hcloud_network.k3s[0].id : var.network_id 15 | network_name = var.network_id == null ? 
hcloud_network.k3s[0].name : data.hcloud_network.k3s[0].name 16 | primary_control_plane_ip = cidrhost(hcloud_network_subnet.k3s_nodes.ip_range, var.control_plane_primary_index) 17 | } 18 | 19 | resource "hcloud_network_subnet" "k3s_nodes" { 20 | type = "cloud" 21 | network_id = local.network_id 22 | network_zone = "eu-central" 23 | ip_range = var.subnet_cidr 24 | } 25 | -------------------------------------------------------------------------------- /main.tf: -------------------------------------------------------------------------------- 1 | resource "random_password" "k3s_cluster_secret" { 2 | length = 48 3 | special = false 4 | } 5 | 6 | resource "hcloud_ssh_key" "provision_public" { 7 | name = "${var.name} - provisioning SSH key" 8 | public_key = local.ssh_public_key 9 | labels = local.common_labels 10 | } 11 | 12 | data "hcloud_image" "ubuntu" { 13 | name = "ubuntu-20.04" 14 | } 15 | 16 | locals { 17 | server_base_packages = ["wireguard"] 18 | cluster_dns_ip = cidrhost(var.service_cidr, 10) 19 | k3s_setup_args = "--cluster-cidr ${var.cluster_cidr} --service-cidr ${var.service_cidr} --cluster-dns ${local.cluster_dns_ip} --disable local-storage --disable-cloud-controller --disable traefik --disable servicelb --flannel-backend=wireguard --kubelet-arg='cloud-provider=external'" 20 | k3s_server_join_cmd = "sh -s - server --server 'https://${local.primary_control_plane_ip}:6443' ${local.k3s_setup_args}" 21 | k3s_server_init_cmd = "sh -s - server --cluster-init ${local.k3s_setup_args}" 22 | } 23 | -------------------------------------------------------------------------------- /example/main.tf: -------------------------------------------------------------------------------- 1 | variable "hcloud_token" {} 2 | 3 | module "demo_cluster" { 4 | source = "./.." 5 | # Can also point to a git repository, e.g. git::https://github.com/StarpTech/k-andy.git?ref=main 6 | hcloud_token = var.hcloud_token 7 | name = "k-andy-demo" 8 | k3s_version = "v1.21.10+k3s1" 9 | server_locations = ["nbg1", "fsn1"] 10 | agent_groups = { 11 | "storage" = { 12 | count = 2 13 | type = "cpx31" 14 | ip_offset = 13 15 | taints = [ 16 | "component=storage:NoSchedule" 17 | ] 18 | } 19 | "small" = { 20 | count = 2 21 | type = "cx21" 22 | ip_offset = 24 23 | taints = [] 24 | } 25 | "medium" = { 26 | count = 1 27 | type = "cx31" 28 | ip_offset = 32 29 | taints = [] 30 | } 31 | } 32 | } 33 | 34 | output "control_plane_ips" { 35 | value = module.demo_cluster.control_planes_public_ips 36 | } 37 | 38 | output "k3s_token" { 39 | value = module.demo_cluster.k3s_token 40 | sensitive = true 41 | } 42 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2021 Dustin Deus 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 
14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /agents.tf: -------------------------------------------------------------------------------- 1 | module "agent_group" { 2 | for_each = var.agent_groups 3 | 4 | source = "./modules/agent_group" 5 | 6 | k3s_cluster_secret = random_password.k3s_cluster_secret.result 7 | k3s_version = var.k3s_version 8 | 9 | taints = each.value.taints 10 | 11 | cluster_name = var.name 12 | group_name = each.key 13 | 14 | server_locations = var.server_locations 15 | 16 | provisioning_ssh_key_id = hcloud_ssh_key.provision_public.id 17 | ssh_private_key = local.ssh_private_key 18 | 19 | control_plane_ip = local.primary_control_plane_ip 20 | network_id = local.network_id 21 | public_control_plane_ip = hcloud_server.first_control_plane.ipv4_address 22 | 23 | subnet_id = hcloud_network_subnet.k3s_nodes.id 24 | subnet_ip_range = hcloud_network_subnet.k3s_nodes.ip_range 25 | 26 | ip_offset = each.value.ip_offset 27 | 28 | server_count = each.value.count 29 | server_type = each.value.type 30 | common_labels = local.common_labels 31 | 32 | additional_packages = concat(local.server_base_packages, var.server_additional_packages) 33 | 34 | depends_on = [hcloud_server.first_control_plane] 35 | } 36 | -------------------------------------------------------------------------------- /output.tf: -------------------------------------------------------------------------------- 1 | output "control_planes_public_ips" { 2 | value = concat([hcloud_server.first_control_plane.ipv4_address], [for server in hcloud_server.control_plane : server.ipv4_address]) 3 | description = "The public IP addresses of the control plane servers" 4 | } 5 | 6 | output "agents_public_ips" { 7 | value = flatten([for agents in module.agent_group : agents.public_ips]) 8 | description = "The public IP addresses of the agent servers" 9 | } 10 | 11 | output "ssh_private_key" { 12 | description = "Key to SSH into nodes" 13 | value = local.ssh_private_key 14 | sensitive = true 15 | } 16 | 17 | output "k3s_token" { 18 | description = "Secret k3s authentication token" 19 | value = random_password.k3s_cluster_secret.result 20 | sensitive = true 21 | } 22 | 23 | output "network_id" { 24 | value = local.network_id 25 | } 26 | 27 | output "subnet_id" { 28 | value = hcloud_network_subnet.k3s_nodes.id 29 | } 30 | 31 | output "cidr_block" { 32 | value = hcloud_network_subnet.k3s_nodes.ip_range 33 | } 34 | 35 | output "server_locations" { 36 | description = "Array of hetzner server locations we deploy to" 37 | value = var.server_locations 38 | } 39 | -------------------------------------------------------------------------------- /example/README.md: -------------------------------------------------------------------------------- 1 | # Example Usage 2 | 3 | ## Environment Setup 4 | 5 | It's easiest if you set up some environment variables. 6 | 7 | This example uses [direnv](https://direnv.net) with an `.envrc` for that, 8 | but you can also just execute the `export` statements in your session. 
9 | 10 | Our `.envrc` here looks like this: 11 | 12 | ```shell 13 | export TF_VAR_hcloud_token=THETOKENYOUGETFROMTHECLOUDCONSOLE 14 | export KUBECONFIG=$(pwd)/kubeconfig-k-andy-demo.yaml 15 | ``` 16 | 17 | The `hcloud_token` is an API Token from a [Hetzner Cloud](https://console.hetzner.cloud/projects) project. 18 | 19 | We also set `KUBECONFIG` so we can later just run `kubectl` in here to interact with the created cluster. 20 | 21 | If you use `direnv`, don't forget to run `direnv allow`. 22 | 23 | ## Cluster Creation 24 | 25 | Now you bring up the cluster with terraform and then test if it's there and looking good. 26 | 27 | ```shell 28 | terraform init 29 | terraform apply 30 | kubectl cluster-info 31 | kubectl get node 32 | ``` 33 | 34 | ## Demo Application 35 | 36 | A demo application can be found in [manifests](manifests/hello-kubernetes.yaml). Run: 37 | 38 | ```sh 39 | kubectl apply -f ../manifests/hello-kubernetes.yaml 40 | ``` 41 | 42 | and try to access `http://:8080`. 43 | 44 | You can find the public IP of the service with `kubectl get service hello-kubernetes -o jsonpath='{.status.loadBalancer.ingress}'` 45 | 46 | ## Destroy your cluster 47 | 48 | If you no longer need the cluster don't forget to destroy it. Load-Balancers and volumes must be deleted manually. 49 | 50 | ```sh 51 | terraform destroy 52 | ``` 53 | -------------------------------------------------------------------------------- /kubeconfig.tf: -------------------------------------------------------------------------------- 1 | data "remote_file" "kubeconfig" { 2 | conn { 3 | host = hcloud_server.first_control_plane.ipv4_address 4 | port = 22 5 | user = "root" 6 | private_key = local.ssh_private_key 7 | } 8 | path = "/etc/rancher/k3s/k3s.yaml" 9 | } 10 | 11 | locals { 12 | kubeconfig_external = replace(data.remote_file.kubeconfig.content, "127.0.0.1", hcloud_server.first_control_plane.ipv4_address) 13 | } 14 | 15 | resource "local_file" "kubeconfig" { 16 | count = var.create_kubeconfig ? 1 : 0 17 | sensitive_content = local.kubeconfig_external 18 | filename = var.kubeconfig_filename == null ? 
"./kubeconfig-${var.name}.yaml" : var.kubeconfig_filename 19 | file_permission = "400" 20 | } 21 | 22 | locals { 23 | kubeconfig_parsed = yamldecode(local.kubeconfig_external) 24 | kubeconfig_data = { 25 | host = local.kubeconfig_parsed["clusters"][0]["cluster"]["server"] 26 | client_certificate = base64decode(local.kubeconfig_parsed["users"][0]["user"]["client-certificate-data"]) 27 | client_key = base64decode(local.kubeconfig_parsed["users"][0]["user"]["client-key-data"]) 28 | cluster_ca_certificate = base64decode(local.kubeconfig_parsed["clusters"][0]["cluster"]["certificate-authority-data"]) 29 | } 30 | } 31 | 32 | output "kubeconfig_file" { 33 | value = local.kubeconfig_external 34 | description = "Kubeconfig file content with external IP address" 35 | sensitive = true 36 | } 37 | 38 | output "kubeconfig" { 39 | description = "Structured kubeconfig data to supply to other providers" 40 | value = local.kubeconfig_data 41 | sensitive = true 42 | } 43 | -------------------------------------------------------------------------------- /manifests/hello-kubernetes.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: apps/v1 2 | kind: Deployment 3 | metadata: 4 | name: hello-kubernetes 5 | spec: 6 | replicas: 1 7 | selector: 8 | matchLabels: 9 | app: hello-kubernetes 10 | template: 11 | metadata: 12 | labels: 13 | app: hello-kubernetes 14 | spec: 15 | containers: 16 | - name: hello-kubernetes 17 | image: paulbouwer/hello-kubernetes:1.10 18 | ports: 19 | - name: http 20 | containerPort: 8080 21 | livenessProbe: 22 | httpGet: 23 | path: / 24 | port: http 25 | readinessProbe: 26 | httpGet: 27 | path: / 28 | port: http 29 | env: 30 | - name: KUBERNETES_NAMESPACE 31 | valueFrom: 32 | fieldRef: 33 | fieldPath: metadata.namespace 34 | - name: KUBERNETES_POD_NAME 35 | valueFrom: 36 | fieldRef: 37 | fieldPath: metadata.name 38 | - name: KUBERNETES_NODE_NAME 39 | valueFrom: 40 | fieldRef: 41 | fieldPath: spec.nodeName 42 | volumes: 43 | - name: my-csi-volume 44 | persistentVolumeClaim: 45 | claimName: csi-pvc 46 | --- 47 | apiVersion: v1 48 | kind: Service 49 | metadata: 50 | name: hello-kubernetes 51 | annotations: 52 | load-balancer.hetzner.cloud/location: nbg1 53 | spec: 54 | type: LoadBalancer 55 | ports: 56 | - port: 8080 57 | targetPort: 8080 58 | selector: 59 | app: hello-kubernetes 60 | --- 61 | apiVersion: v1 62 | kind: PersistentVolumeClaim 63 | metadata: 64 | name: csi-pvc 65 | spec: 66 | accessModes: 67 | - ReadWriteOnce 68 | resources: 69 | requests: 70 | storage: 10Gi 71 | storageClassName: hcloud-volumes -------------------------------------------------------------------------------- /modules/agent_group/variables.tf: -------------------------------------------------------------------------------- 1 | variable "cluster_name" { 2 | description = "Cluster name (used in naming the servers)" 3 | } 4 | 5 | variable "group_name" { 6 | description = "Name of the agent group" 7 | } 8 | 9 | variable "server_locations" { 10 | description = "Server locations to create agents in" 11 | } 12 | 13 | variable "additional_packages" { 14 | default = [] 15 | } 16 | 17 | variable "server_count" { 18 | description = "Number of agent nodes" 19 | default = 2 20 | } 21 | 22 | variable "server_type" { 23 | description = "Server type of agent server group" 24 | default = "cx21" 25 | } 26 | 27 | variable "provisioning_ssh_key_id" { 28 | description = "ID of the hcloud SSH key to provision the node group with" 29 | } 30 | 31 | variable "control_plane_ip" { 32 | 
description = "Control plane IP to connect to" 33 | } 34 | 35 | variable "public_control_plane_ip" { 36 | description = "Public control plane IP" 37 | } 38 | 39 | variable "taints" { 40 | description = "Taints each worker gets" 41 | type = list(string) 42 | } 43 | 44 | variable "k3s_version" { 45 | description = "K3S version, should match the control plane" 46 | } 47 | 48 | variable "k3s_cluster_secret" { 49 | description = "K3S cluster token to authenticate against control plane" 50 | } 51 | 52 | variable "network_id" { 53 | description = "Network ID to place agents in" 54 | } 55 | 56 | variable "subnet_id" { 57 | description = "ID of the subnet in which agents are started" 58 | } 59 | 60 | variable "subnet_ip_range" { 61 | description = "CIDR block of the subnet" 62 | } 63 | 64 | variable "ip_offset" { 65 | description = "Offset from which agents are IPs are counted upwards. Needs to be adjusted to not cause collisions!" 66 | } 67 | 68 | 69 | variable "ssh_private_key" { 70 | description = "SSH private key to connect directly to server (used for remote-exec)" 71 | } 72 | 73 | variable "common_labels" { 74 | description = "Additional labels to add to server instances" 75 | default = {} 76 | } -------------------------------------------------------------------------------- /control_plane.tf: -------------------------------------------------------------------------------- 1 | resource "hcloud_server" "control_plane" { 2 | for_each = { for i in range(1, var.control_plane_server_count) : "#${i}" => i } 3 | name = "${var.name}-control-plane-${each.value}" 4 | 5 | image = data.hcloud_image.ubuntu.name 6 | server_type = var.control_plane_server_type 7 | location = element(var.server_locations, each.value) 8 | 9 | ssh_keys = [hcloud_ssh_key.provision_public.id] 10 | labels = merge({ 11 | node_type = "control-plane" 12 | }, local.common_labels) 13 | 14 | # Join cluster as server after first boot 15 | user_data = format("%s\n%s", "#cloud-config", yamlencode( 16 | { 17 | runcmd = [ 18 | "curl -sfL https://get.k3s.io | K3S_TOKEN='${random_password.k3s_cluster_secret.result}' INSTALL_K3S_VERSION='${var.k3s_version}' ${local.k3s_server_join_cmd}" 19 | ] 20 | packages = concat(local.server_base_packages, var.server_additional_packages) 21 | } 22 | )) 23 | 24 | network { 25 | network_id = local.network_id 26 | ip = cidrhost(hcloud_network_subnet.k3s_nodes.ip_range, each.value + 1) 27 | } 28 | 29 | provisioner "remote-exec" { 30 | inline = [ 31 | "until systemctl is-active --quiet k3s.service; do sleep 1; done", 32 | "until kubectl get node ${self.name}; do sleep 1; done", 33 | # Disable workloads on master node 34 | "kubectl taint node ${self.name} node-role.kubernetes.io/master=true:NoSchedule", 35 | "kubectl taint node ${self.name} CriticalAddonsOnly=true:NoExecute", 36 | ] 37 | 38 | connection { 39 | host = self.ipv4_address 40 | type = "ssh" 41 | user = "root" 42 | private_key = local.ssh_private_key 43 | } 44 | } 45 | 46 | // Otherwise we would be in a case where this would always be recreated because we switch the primary control plane IP 47 | lifecycle { 48 | ignore_changes = [user_data] 49 | } 50 | 51 | depends_on = [ 52 | hcloud_server.first_control_plane 53 | ] 54 | } 55 | 56 | resource "hcloud_server_network" "control_plane" { 57 | for_each = { for i in range(1, var.control_plane_server_count) : "#${i}" => i } // starts at 1 because master was 0 58 | subnet_id = hcloud_network_subnet.k3s_nodes.id 59 | server_id = hcloud_server.control_plane[each.key].id 60 | ip = 
cidrhost(hcloud_network_subnet.k3s_nodes.ip_range, each.value + 1) 61 | } 62 | -------------------------------------------------------------------------------- /modules/agent_group/agent.tf: -------------------------------------------------------------------------------- 1 | locals { 2 | node_taint_args_raw = join(" ", [for taint in var.taints : "--node-taint ${taint}"]) 3 | node_taint_args = length(var.taints) == 0 ? "" : "${local.node_taint_args_raw} " // has to end with space to not conflict with next arg 4 | } 5 | 6 | resource "hcloud_server" "agent" { 7 | for_each = { for i in range(0, var.server_count) : "#${i}" => i } 8 | name = "${var.cluster_name}-${var.group_name}-${each.value}-${local.agent_pet_names[each.value]}" 9 | 10 | image = data.hcloud_image.ubuntu.name 11 | server_type = var.server_type 12 | location = element(var.server_locations, each.value) 13 | 14 | ssh_keys = [var.provisioning_ssh_key_id] 15 | labels = merge({ 16 | node_type = "worker" 17 | cluster = var.cluster_name 18 | }, var.common_labels) 19 | 20 | # Join cluster as agent after first boot 21 | # Adding the random pet name as comment is a trick to recreate the server on pet-name change 22 | user_data = format("%s\n#%s\n%s", "#cloud-config", local.agent_pet_names[each.value], yamlencode( 23 | { 24 | runcmd = [ 25 | "curl -sfL https://get.k3s.io | K3S_URL='https://${var.control_plane_ip}:6443' INSTALL_K3S_VERSION='${var.k3s_version}' K3S_TOKEN='${var.k3s_cluster_secret}' sh -s - agent --node-ip='${cidrhost(var.subnet_ip_range, var.ip_offset + each.value)}' ${local.node_taint_args}--kubelet-arg='cloud-provider=external' --kubelet-arg='node-labels=agent-group=${var.group_name},agent-index=${each.value}'" 26 | ] 27 | packages = var.additional_packages 28 | } 29 | )) 30 | 31 | network { 32 | network_id = var.network_id 33 | ip = cidrhost(var.subnet_ip_range, var.ip_offset + each.value) 34 | } 35 | 36 | provisioner "remote-exec" { 37 | inline = [ 38 | "until systemctl is-active --quiet k3s-agent.service; do sleep 1; done" 39 | ] 40 | 41 | connection { 42 | host = self.ipv4_address 43 | type = "ssh" 44 | user = "root" 45 | private_key = var.ssh_private_key 46 | } 47 | } 48 | } 49 | 50 | resource "hcloud_server_network" "agent" { 51 | for_each = { for i in range(0, var.server_count) : "#${i}" => i } 52 | subnet_id = var.subnet_id 53 | server_id = hcloud_server.agent[each.key].id 54 | ip = cidrhost(var.subnet_ip_range, var.ip_offset + each.value) // start at x.y.z.OFFSET 55 | } 56 | -------------------------------------------------------------------------------- /control_plane_primary.tf: -------------------------------------------------------------------------------- 1 | resource "hcloud_server" "first_control_plane" { 2 | name = "${var.name}-control-plane-0" 3 | 4 | image = data.hcloud_image.ubuntu.name 5 | server_type = var.control_plane_server_type 6 | location = var.server_locations[0] 7 | 8 | ssh_keys = [hcloud_ssh_key.provision_public.id] 9 | labels = merge({ 10 | node_type = "control-plane" 11 | }, local.common_labels) 12 | 13 | user_data = format("%s\n%s", "#cloud-config", yamlencode( 14 | { 15 | runcmd = [ 16 | "curl -sfL https://get.k3s.io | K3S_TOKEN='${random_password.k3s_cluster_secret.result}' INSTALL_K3S_VERSION='${var.k3s_version}' ${var.control_plane_already_initialized ? 
local.k3s_server_join_cmd : local.k3s_server_init_cmd}" 17 | ] 18 | packages = concat(local.server_base_packages, var.server_additional_packages) 19 | } 20 | )) 21 | 22 | provisioner "remote-exec" { 23 | inline = [ 24 | "until systemctl is-active --quiet k3s.service; do sleep 1; done", 25 | "until kubectl get node ${self.name}; do sleep 1; done", 26 | # Disable workloads on master node 27 | "kubectl taint node ${self.name} node-role.kubernetes.io/master=true:NoSchedule", 28 | "kubectl taint node ${self.name} CriticalAddonsOnly=true:NoExecute", 29 | # Install hetzner CCM 30 | "kubectl -n kube-system create secret generic hcloud --from-literal=token=${var.hcloud_token} --from-literal=network=${local.network_name}", 31 | "kubectl apply -f -< 2 | 3 | 5 | 6 | 34 | 36 | 38 | 40 | 42 | 45 | 76 | 79 | 82 | 86 | 89 | 90 | 91 | 92 | 93 | 94 | 95 | 96 | 97 | 98 | 99 | 100 | 101 | 102 | 103 | 104 | 105 | 106 | 107 | 108 | 109 | 110 | 111 | 112 | 113 | 114 | 115 | 116 | 117 | 118 | 119 | 120 | 121 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # k-andy 2 | 3 | 4 | 5 | ### Zero friction Kubernetes stack on Hetzner Cloud 6 | 7 | This [terraform](https://www.terraform.io/) module will install a High Availability [K3s](https://k3s.io/) Cluster with Embedded DB in a private network on [Hetzner Cloud](https://www.hetzner.com/de/cloud). The following resources are provisionised by default (**20€/mo**): 8 | 9 | - 3x Control-plane: _CX11_, 2GB RAM, 1VCPU, 20GB NVMe, 20TB Traffic. 10 | - 2x Worker: _CX21_, 4GB RAM, 2VCPU, 40GB NVMe, 20TB Traffic. 11 | - Network: Private network with one subnet. 12 | - Server and agent nodes are distributed across 3 Datacenters (nbg1, fsn1, hel1) for high availability. 13 | 14 |
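A minimal sketch of how the module can be consumed (the module label `k3s_cluster` and the `var.hcloud_token` variable are illustrative; every input shown is documented in the Inputs table below, and a complete walk-through lives in the [example folder](./example)):

```hcl
module "k3s_cluster" {
  # The source can also point to a local checkout of this repository
  source = "git::https://github.com/StarpTech/k-andy.git?ref=main"

  hcloud_token = var.hcloud_token # Hetzner Cloud API token
  name         = "demo"           # prefix used for all created resources

  # One worker group named "default": two cx21 servers, no taints
  agent_groups = {
    "default" = {
      count     = 2
      type      = "cx21"
      ip_offset = 33
      taints    = []
    }
  }
}
```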
15 |
16 | 17 | --- 18 | 19 | > **Note**: Are you looking for the next generation API Developer Platform? 🔎 Have a look at: [WunderGraph](https://github.com/wundergraph/wundergraph) 20 | Turn your services, databases and 3rd party APIs into a secure unified API in just a few minutes. 🪄 21 | 22 | --- 23 | 24 | **What is K3s?** 25 | 26 | K3s is a lightweight certified kubernetes distribution. It's packaged as single binary and comes with solid defaults for storage and networking but we replaced [local-path-provisioner](https://github.com/rancher/local-path-provisioner) with hetzner [CSI-driver](https://github.com/hetznercloud/csi-driver) and [klipper load-balancer](https://github.com/k3s-io/klipper-lb) with hetzner [Cloud Controller Manager](https://github.com/hetznercloud/hcloud-cloud-controller-manager). The default ingress controller (traefik) has been disabled. 27 | 28 | **Hetzner Cloud integration**: 29 | 30 | - Preinstalled [CSI-driver](https://github.com/hetznercloud/csi-driver) for volume support. 31 | - Preinstalled [Cloud Controller Manager for Hetzner Cloud](https://github.com/hetznercloud/hcloud-cloud-controller-manager) for Load Balancer support. 32 | 33 | **Auto-K3s-Upgrades** 34 | 35 | Enable the upgrade-controller (`enable_upgrade_controller = true`) and specify your target k3s version (`upgrade_k3s_target_version`). See [here](https://github.com/k3s-io/k3s/releases) for possible versions. 36 | 37 | Label the nodes you want to upgrade, e.g. `kubectl label nodes core-control-plane-1 k3s-upgrade=true`. The concurrency 38 | of the upgrade plan is set to 1, so you can also label them all at once. Agent nodes will be drained one by one during 39 | the upgrade. 40 | 41 | You can label all control-plane nodes by using `kubectl label nodes -l node-role.kubernetes.io/control-plane=true k3s-upgrade=true`. 42 | All agent nodes can be labelled using `kubectl label nodes -l !node-role.kubernetes.io/control-plane k3s-upgrade=true`. 43 | 44 | To remove the label from all nodes you can run `kubectl label nodes --all k3s-upgrade-`. 45 | 46 | After a successful update you can also remove the upgrade controller and the plans again, setting `enable_upgrade_controller` to `false`. 47 | 48 | ## Usage 49 | 50 | See a more detailed example with walk-through in the [example folder](./example). 51 | 52 | 53 | ### Inputs 54 | 55 | | Name | Description | Type | Default | Required | 56 | |------|-------------|------|---------|:--------:| 57 | | [agent\_groups](#input\_agent\_groups) | Configuration of agent groups |
<pre>map(object({<br>    type      = string<br>    count     = number<br>    ip_offset = number<br>    taints    = list(string)<br>  }))</pre> | <pre>{<br>  "default": {<br>    "count": 2,<br>    "ip_offset": 33,<br>    "taints": [],<br>    "type": "cx21"<br>  }<br>}</pre>
| no | 58 | | [cluster\_cidr](#input\_cluster\_cidr) | Network CIDR to use for pod IPs | `string` | `"10.42.0.0/16"` | no | 59 | | [control\_plane\_already\_initialized](#input\_control\_plane\_already\_initialized) | Use this if you have to replace the first control plane and want the primary to join other already existing ones and not do an init anymore. You have to update `control_plane_primary_index` to something else too. | `bool` | `false` | no | 60 | | [control\_plane\_primary\_index](#input\_control\_plane\_primary\_index) | Which of the servers should be the primary to connect to? If you change it from 1, also set `control_plane_already_initialized` to true. (1-indexed!) | `number` | `1` | no | 61 | | [control\_plane\_server\_count](#input\_control\_plane\_server\_count) | Number of control plane nodes | `number` | `3` | no | 62 | | [control\_plane\_server\_type](#input\_control\_plane\_server\_type) | Server type of control plane servers | `string` | `"cx11"` | no | 63 | | [create\_kubeconfig](#input\_create\_kubeconfig) | Create a local kubeconfig file to connect to the cluster | `bool` | `true` | no | 64 | | [enable\_upgrade\_controller](#input\_enable\_upgrade\_controller) | Install the rancher system-upgrade-controller | `bool` | `false` | no | 65 | | [hcloud\_csi\_driver\_version](#input\_hcloud\_csi\_driver\_version) | n/a | `string` | `"v1.6.0"` | no | 66 | | [hcloud\_token](#input\_hcloud\_token) | Token to authenticate against Hetzner Cloud | `any` | n/a | yes | 67 | | [k3s\_version](#input\_k3s\_version) | K3s version | `string` | `"v1.21.3+k3s1"` | no | 68 | | [kubeconfig\_filename](#input\_kubeconfig\_filename) | Specify the filename of the created kubeconfig file (defaults to kubeconfig-${var.name}.yaml | `any` | `null` | no | 69 | | [name](#input\_name) | Cluster name (used in various places, don't use special chars) | `any` | n/a | yes | 70 | | [network\_cidr](#input\_network\_cidr) | Network in which the cluster will be placed. Ignored if network\_id is defined | `string` | `"10.0.0.0/16"` | no | 71 | | [network\_id](#input\_network\_id) | If specified, no new network will be created. Make sure cluster\_cidr and service\_cidr don't collide with anything in the existing network. | `any` | `null` | no | 72 | | [server\_additional\_packages](#input\_server\_additional\_packages) | Additional packages which will be installed on node creation | `list(string)` | `[]` | no | 73 | | [server\_locations](#input\_server\_locations) | Server locations in which servers will be distributed | `list(string)` |
<pre>[<br>  "nbg1",<br>  "fsn1",<br>  "hel1"<br>]</pre>
| no | 74 | | [service\_cidr](#input\_service\_cidr) | Network CIDR to use for services IPs | `string` | `"10.43.0.0/16"` | no | 75 | | [ssh\_private\_key\_location](#input\_ssh\_private\_key\_location) | Use this private SSH key instead of generating a new one (Attention: Encrypted keys are not supported) | `string` | `null` | no | 76 | | [subnet\_cidr](#input\_subnet\_cidr) | Subnet in which all nodes are placed | `string` | `"10.0.1.0/24"` | no | 77 | | [upgrade\_controller\_image\_tag](#input\_upgrade\_controller\_image\_tag) | The image tag of the upgrade controller (See https://github.com/rancher/system-upgrade-controller/releases) | `string` | `"v0.8.0"` | no | 78 | | [upgrade\_controller\_kubectl\_image\_tag](#input\_upgrade\_controller\_kubectl\_image\_tag) | rancher/kubectl image tag | `string` | `"v1.21.5"` | no | 79 | | [upgrade\_k3s\_target\_version](#input\_upgrade\_k3s\_target\_version) | Target version of k3s (See https://github.com/k3s-io/k3s/releases) | `string` | `null` | no | 80 | | [upgrade\_node\_additional\_tolerations](#input\_upgrade\_node\_additional\_tolerations) | List of tolerations which upgrade jobs must have to run on every node (for control-plane and agents) | `list(map(any))` | `[]` | no | 81 | 82 | ### Outputs 83 | 84 | | Name | Description | 85 | |------|-------------| 86 | | [agents\_public\_ips](#output\_agents\_public\_ips) | The public IP addresses of the agent servers | 87 | | [cidr\_block](#output\_cidr\_block) | n/a | 88 | | [control\_planes\_public\_ips](#output\_control\_planes\_public\_ips) | The public IP addresses of the control plane servers | 89 | | [k3s\_token](#output\_k3s\_token) | Secret k3s authentication token | 90 | | [kubeconfig](#output\_kubeconfig) | Structured kubeconfig data to supply to other providers | 91 | | [kubeconfig\_file](#output\_kubeconfig\_file) | Kubeconfig file content with external IP address | 92 | | [network\_id](#output\_network\_id) | n/a | 93 | | [server\_locations](#output\_server\_locations) | Array of hetzner server locations we deploy to | 94 | | [ssh\_private\_key](#output\_ssh\_private\_key) | Key to SSH into nodes | 95 | | [subnet\_id](#output\_subnet\_id) | n/a | 96 | 97 | 98 | ## Common Operations 99 | 100 | ### Agent server replacement (common case) 101 | 102 | If you need to cycle an agent, you can do that with a single node following this procedure. 103 | Replace the group name and number with the server you want to recreate! 104 | 105 | Make sure you drain the nodes first. 106 | 107 | ```shell 108 | kubectl drain that-agent 109 | terraform taint 'module.my_cluster.module.agent_group["GROUP_NAME"].random_pet.agent_suffix[1]' 110 | terraform apply 111 | ``` 112 | 113 | This will recreate the agent in that group on next apply. 114 | 115 | ### Sophisticated agent server replacement 116 | 117 | If you did some weird config change or recreate them by changing the base k3s version in the terraform configuration and 118 | terraform wants to replace all your agents at once you can do this. Replacing all by one is probably not a good idea. 
119 | 120 | Example for replacement of one agent (the first one of that group): 121 | 122 | ```shell 123 | kubectl drain that-agent 124 | terragrunt taint 'module.agent_group["GROUP_NAME"].random_pet.agent_suffix[0]' 125 | terraform apply --target='module.agent_group["GROUP_NAME"].hcloud_server.agent["#0"]' --target='module.agent_group["GROUP_NAME"].hcloud_server_network.agent["#0"]' --target='module.agent_group["GROUP_NAME"].random_pet.agent_suffix[0]' 126 | ``` 127 | 128 | ### Control Plane server replacement 129 | 130 | Control plane servers do not get recreated when the user-data for cloud-init changes. If you want to recreate one after 131 | you changed something which would change the cloud-init, you need to taint it. 132 | 133 | #### Primary server 134 | 135 | If you for some reason need to replace the primary control plane, you'll need to tell it to join the others. 136 | 137 | Set the variable `control_plane_primary_index` to one of the other control plane nodes (e.g. 2 or 3). 138 | Also set `control_plane_already_initialized` to `true` so it won't run a `cluster-init` again. This will make the primary 139 | connect to control-plane 2 or 3 after recreation. 140 | 141 | #### Secondary servers 142 | 143 | This is how you can replace the servers which didn't initialize the cluster. 144 | 145 | ```shell 146 | terraform taint 'module.my_cluster.hcloud_server.control_plane["#1"]' 147 | terraform apply 148 | ``` 149 | 150 | ## Auto-Upgrade 151 | 152 | ### Prerequisite 153 | 154 | Install the system-upgrade-controller in your cluster. 155 | 156 | ``` 157 | KUBECONFIG=kubeconfig.yaml kubectl apply -f ./upgrade/controller.yaml 158 | ``` 159 | 160 | ## Upgrade procedure 161 | 162 | 1. Mark the nodes you want to upgrade (the command below marks all nodes). 163 | 164 | ``` 165 | KUBECONFIG=kubeconfig.yaml kubectl label --all node k3s-upgrade=true 166 | ``` 167 | 168 | 2. Run the plan for the **servers**. 169 | 170 | ``` 171 | KUBECONFIG=kubeconfig.yaml kubectl apply -f ./upgrade/server-plan.yaml 172 | ``` 173 | 174 | > **Warning:** Wait for completion [before you start upgrading your agents](https://github.com/k3s-io/k3s/issues/2996#issuecomment-788352375). 175 | 176 | 3. Run the plan for the **agents**. 177 | 178 | ``` 179 | KUBECONFIG=kubeconfig.yaml kubectl apply -f ./upgrade/agent-plan.yaml 180 | ``` 181 | 182 | ## Backups 183 | 184 | K3s will automatically back up your embedded etcd datastore every 12 hours to `/var/lib/rancher/k3s/server/db/snapshots/`. 185 | You can reset the cluster by pointing to a specific snapshot. 186 | 187 | 1. Stop the master server. 188 | 189 | ```sh 190 | sudo systemctl stop k3s 191 | ``` 192 | 193 | 2. Restore the master server from a snapshot. 194 | 195 | ```sh 196 | ./k3s server \ 197 | --cluster-reset \ 198 | --cluster-reset-restore-path= 199 | ``` 200 | 201 | > **Warning:** This forgets all peers and the server becomes the sole member of a new cluster. You have to manually rejoin all other servers. 202 | 203 | 3. Connect to each of the other servers. Back up and delete `/var/lib/rancher/k3s/server/db` on each of them. 204 | 205 | ```sh 206 | sudo systemctl stop k3s 207 | rm -rf /var/lib/rancher/k3s/server/db 208 | sudo systemctl start k3s 209 | ``` 210 | 211 | This will rejoin the servers one after another. After some time, all servers should be in sync again. Run `kubectl get node` to verify it. 212 | 213 | > **Info:** No official tool exists to automate this procedure. 
In the future, Rancher might provide an operator to handle this ([issue](https://github.com/k3s-io/k3s/issues/3174)). 214 | 215 | ## Debugging 216 | 217 | Cloud-init and k3s logs can be found on the remote machines via: 218 | 219 | - `/var/log/cloud-init-output.log` 220 | - `/var/log/cloud-init.log` 221 | - `journalctl -u k3s.service -e` for the last logs of the server 222 | - `journalctl -u k3s-agent.service -e` for the last logs of the agent 223 | 224 | ## Credits 225 | 226 | - [terraform-hcloud-k3s](https://github.com/cicdteam/terraform-hcloud-k3s) Terraform module which creates a single node cluster. 227 | - [terraform-module-k3](https://github.com/xunleii/terraform-module-k3s) Terraform module which creates a k3s cluster, with multi-server and management features. 228 | - Icon created by [Freepik](https://www.freepik.com) from [www.flaticon.com](https://www.flaticon.com/de/) 229 | --------------------------------------------------------------------------------
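As a closing note on the `kubeconfig` output listed in the Outputs table above, here is a hedged sketch of feeding it into the `kubernetes` provider; the module label `my_cluster` is illustrative, while the attribute names match the structured `kubeconfig` output defined in `kubeconfig.tf`:

```hcl
# Reuse the cluster credentials exported by this module in other providers.
provider "kubernetes" {
  host                   = module.my_cluster.kubeconfig.host
  client_certificate     = module.my_cluster.kubeconfig.client_certificate
  client_key             = module.my_cluster.kubeconfig.client_key
  cluster_ca_certificate = module.my_cluster.kubeconfig.cluster_ca_certificate
}
```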