Skip to content

Commit

Permalink
tools: periodically clean up bare-metal servers
Browse files Browse the repository at this point in the history
  • Loading branch information
davidweisse committed Oct 21, 2024
1 parent 0db5c0e commit 72030f2
Show file tree
Hide file tree
Showing 4 changed files with 154 additions and 0 deletions.
58 changes: 58 additions & 0 deletions packages/cleanup-bm.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,58 @@
#!/usr/bin/env bash
# Copyright 2024 Edgeless Systems GmbH
# SPDX-License-Identifier: AGPL-3.0-only

set -euo pipefail

echo "Starting cleanup"

resourcesToCheck=(
"pods"
"deployments"
"statefulsets"
"daemonsets"
"replicasets"
"jobs"
"cronjobs"
)

touch usedRuntimeClasses
for resource in "${resourcesToCheck[@]}"; do
kubectl get "${resource}" --all-namespaces -o jsonpath='{.items[*].spec.runtimeClassName} {.items[*].spec.template.spec.runtimeClassName} {.items[*].spec.jobTemplate.spec.template.spec.runtimeClassName}' 2>/dev/null |
tr ' ' '\n' >>usedRuntimeClasses
done

kubectl get pods --all-namespaces -o jsonpath='{.items[?(@.metadata.annotations.contrast\.edgeless\.systems/pod-role=="contrast-node-installer")].spec.containers[0].args[1]}' |
tr ' ' '\n' |
grep -o "contrast-cc-.\+" >>usedRuntimeClasses
sort -u usedRuntimeClasses -o usedRuntimeClasses

mapfile -t unusedRuntimeClasses < <(
comm -13 usedRuntimeClasses <(
kubectl get runtimeclass -o jsonpath='{.items[*].metadata.name}' |
tr ' ' '\n' |
grep '^contrast-cc' |
sort -u
)
)

for runtimeClass in "${unusedRuntimeClasses[@]}"; do
# Delete unused runtime classes
echo "Deleting runtimeclass ${runtimeClass} ..."
kubectl delete runtimeclass "${runtimeClass}"

# Delete unused files
if [ -d "${OPTEDGELESS}/${runtimeClass}" ]; then
echo "Deleting files from ${OPTEDGELESS}/${runtimeClass} ..."
rm -rf "${OPTEDGELESS:?}/${runtimeClass}"
fi
if [ -d "/var/lib/${SNAPSHOTTER}-snapshotter" ]; then
echo "Deleting files from /var/lib/${SNAPSHOTTER}-snapshotter/${runtimeClass} ..."
rm -rf "/var/lib/${SNAPSHOTTER}-snapshotter/${runtimeClass}"
fi

# Remove references from containerd config
echo "Removing ${runtimeClass} from ${CONFIG} ..."
dasel delete --file "${CONFIG}" --indent 0 --read toml --write toml "plugins.io\.containerd\.grpc\.v1\.cri.containerd.runtimes.${runtimeClass}" 2>/dev/null
dasel delete --file "${CONFIG}" --indent 0 --read toml --write toml "proxy_plugins.${SNAPSHOTTER}-${runtimeClass}" 2>/dev/null
done
8 changes: 8 additions & 0 deletions packages/containers.nix
Original file line number Diff line number Diff line change
Expand Up @@ -155,6 +155,14 @@ let
Env = [ "PATH=/bin" ]; # This is only here for policy generation.
};
};

cleanup-bm = dockerTools.buildImage {
name = "cleanup-bm";
tag = "v0.0.1";
config = {
Cmd = [ "${lib.getExe pkgs.scripts.cleanup-bm}" ];
};
};
};
in
containers
Expand Down
10 changes: 10 additions & 0 deletions packages/scripts.nix
Original file line number Diff line number Diff line change
Expand Up @@ -490,4 +490,14 @@
kubectl apply -k "$tmpdir/overlays/azure"
'';
};

cleanup-bm = writeShellApplication {
name = "cleanup-bm";
runtimeInputs = with pkgs; [
busybox
kubectl
dasel
];
text = builtins.readFile ./cleanup-bm.sh;
};
}
78 changes: 78 additions & 0 deletions tools/bm-maintenance/deployment_tdx_snp.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,78 @@
apiVersion: v1
kind: ServiceAccount
metadata:
name: cleanup-sa
---
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRole
metadata:
name: cleanup-role
rules:
- apiGroups: [""]
resources: ["pods"]
verbs: ["list"]
- apiGroups: ["apps"]
resources: ["deployments", "statefulsets", "daemonsets", "replicasets"]
verbs: ["list"]
- apiGroups: ["batch"]
resources: ["jobs", "cronjobs"]
verbs: ["list"]
- apiGroups: ["node.k8s.io"]
resources: ["runtimeclasses"]
verbs: ["list", "delete"]
---
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRoleBinding
metadata:
name: cleanup-binding
subjects:
- kind: ServiceAccount
name: cleanup-sa
namespace: default
roleRef:
kind: ClusterRole
name: cleanup-role
apiGroup: rbac.authorization.k8s.io
---
apiVersion: batch/v1
kind: CronJob
metadata:
name: cleanup-maintenance
spec:
schedule: "0 0 * * 0"
jobTemplate:
spec:
template:
spec:
serviceAccountName: cleanup-sa
containers:
- name: cleanup
image: ghcr.io/edgelesssys/contrast/cleanup-bm:v0.0.1
env:
- name: OPTEDGELESS
value: /opt/edgeless
- name: CONFIG
value: /var/lib/rancher/k3s/agent/etc/containerd/config.toml.tmpl
- name: SNAPSHOTTER
value: nydus
volumeMounts:
- name: opt-edgeless
mountPath: /opt/edgeless
- name: snapshotter-data
mountPath: /var/lib/nydus-snapshotter
- name: containerd-config
mountPath: /var/lib/rancher/k3s/agent/etc/containerd
volumes:
- name: opt-edgeless
hostPath:
path: /opt/edgeless
type: Directory
- name: snapshotter-data
hostPath:
path: /var/lib/nydus-snapshotter
type: Directory
- name: containerd-config
hostPath:
path: /var/lib/rancher/k3s/agent/etc/containerd
type: Directory
restartPolicy: OnFailure

0 comments on commit 72030f2

Please sign in to comment.