From ea7e123e25b44c6eb67a760a5d9ab09f445a245c Mon Sep 17 00:00:00 2001
From: Yash Gorana
Date: Thu, 19 Sep 2024 23:02:15 +0530
Subject: [PATCH] improve commands + reset script + delete ns speed

---
 justfile             | 284 ++++++++++++++++++++++---------------------
 scripts/reset_k8s.sh |  52 ++++----
 2 files changed, 169 insertions(+), 167 deletions(-)

diff --git a/justfile b/justfile
index 8df4a9637b5..78caf7bc747 100644
--- a/justfile
+++ b/justfile
@@ -1,19 +1,43 @@
+# Rules for new commands
+# - Start with a verb
+# - Keep it short (max. 3 words)
+# - Group commands by context. Include group name in the command name.
+# - Mark things private that are util functions with [private] or _var
+# - Don't over-engineer, keep it simple.
+# - Don't break existing commands
+
 set dotenv-load

 # ---------------------------------------------------------------------------------------------------------------------
-
-cluster_default := "k3d-syft-dev"
-cluster_high := "k3d-syft-high"
-cluster_low := "k3d-syft-low"
-cluster_gw := "k3d-syft-gw"
-cluster_signoz := "k3d-signoz"
-ns_default := "syft"
-ns_high := "high"
-ns_low := "low"
-ns_gw := "gw"
+# K3D cluster names
+# Note: These are private (_ prefix) because we don't want it to be editable from CLI.
+_name_default := "syft-dev"
+_name_high := "syft-high"
+_name_low := "syft-low"
+_name_gw := "syft-gw"
+_name_signoz := "signoz"
+
+# K3D Registry name is used only in k3d.
+_name_registry := "registry.localhost"
+
+# Kubernetes namespaces for the deployments
+# Note: These are private (_ prefix) because we don't want it to be editable from CLI.
+_ns_default := "syft"
+_ns_high := "high"
+_ns_low := "low"
+_ns_gw := "gw"
+
+# Kubernetes context names generated for the K3D clusters
+# Note: These are private (_ prefix) because we don't want it to be editable from CLI.
+_ctx_default := "k3d-" + _name_default
+_ctx_high := "k3d-" + _name_high
+_ctx_low := "k3d-" + _name_low
+_ctx_gw := "k3d-" + _name_gw
+_ctx_signoz := "k3d-" + _name_signoz

 # ---------------------------------------------------------------------------------------------------------------------

+# Static Ports for the clusters
 port_default := "8080"
 port_high := port_default
 port_low := "8081"
@@ -22,21 +46,27 @@ port_signoz_ui := "3301"
 port_signoz_otel := "4317"
 port_registry := "5800"

-registry_url := "k3d-registry.localhost:" + port_registry
+# Registry URL is used for
+# - setting up the registry for k3d clusters
+# - setting up the --var CONTAINER_REGISTRY for devspace deployments
+# Note: Do not add http:// or https:// prefix
+registry_url := "k3d-" + _name_registry + ":" + port_registry
+
+# Signoz OTel endpoint is used for setting up the Otel collector
 signoz_otel_url := "http://host.k3d.internal:" + port_signoz_otel

 # ---------------------------------------------------------------------------------------------------------------------
-
 # devspace profiles (comma-separated)
 profiles := ""

 # enable tracing by adding "tracing" profile in devspace
 tracing := "true"

+# add tracing profile if enabled
+# This is private (_ prefix) to have a simple `just tracing=true ...`
 _g_profiles := if tracing == "true" { profiles + ",tracing" } else { profiles }

 # ---------------------------------------------------------------------------------------------------------------------
-
 # this might break if you have alias python = python3 or either of the executable not pointing to the correct one
 # just fix your system instead of making of fixing this
 python_path := `which python || which python3`
@@ -48,126 +78,112 @@ python_path := `which python || which python3`

 # ---------------------------------------------------------------------------------------------------------------------

-# Start a local registry on http://k3d-registry.localhost:{{port_registry}}
+# Start a local registry on http://k3d-registry.localhost:5800 (port_registry=5800 or registry_url="gcr.io/path/to/registry")
 [group('registry')]
 start-registry:
     k3d --version
     @-docker volume create k3d-registry-vol
-    @-k3d registry create registry.localhost --port {{ port_registry }} -v k3d-registry-vol:/var/lib/registry --no-help
+    @-k3d registry create {{ _name_registry }} --port {{ port_registry }} -v k3d-registry-vol:/var/lib/registry --no-help

-    if ! grep -q k3d-registry.localhost /etc/hosts; then \
+    if ! grep -q {{ _name_registry }} /etc/hosts; then \
         sudo {{ python_path }} scripts/patch_hosts.py --add-k3d-registry --fix-docker-hosts; \
     fi

-    @curl --silent --retry 5 --retry-all-errors http://k3d-registry.localhost:{{ port_registry }}/v2/_catalog | jq
-    @echo "\033[1;32mRegistring running at http://k3d-registry.localhost:{{ port_registry }}\033[0m"
+    @curl --silent --retry 5 --retry-all-errors http://{{ registry_url }}/v2/_catalog | jq
+    @echo "\033[1;32mRegistry running at http://{{ registry_url }}\033[0m"

 [group('registry')]
 delete-registry:
-    -k3d registry delete registry.localhost
+    -k3d registry delete {{ _name_registry }}
     -docker volume rm k3d-registry-vol

 # ---------------------------------------------------------------------------------------------------------------------

-# Launch a Datasite high-side cluster on http://localhost:{{port_high}}
+# Launch a Datasite high-side cluster on http://localhost:8080 (port_high=8080)
 [group('highside')]
-start-high: (delete-cluster cluster_high) (create-cluster cluster_high port_high)
+start-high: (create-cluster _name_high port_high)

 # Stop the Datasite high-side cluster
 [group('highside')]
-delete-high: (delete-cluster cluster_high)
+delete-high: (delete-cluster _name_high)

 # Deploy Syft to the high-side cluster
 [group('highside')]
-deploy-high: (deploy-devspace cluster_high ns_default)
+deploy-high: (deploy-devspace _ctx_high _ns_default)

 # Reset Syft DB state in the high-side cluster
 [group('highside')]
-reset-high: (reset-syft cluster_high ns_default)
+reset-high: (reset-syft _ctx_high _ns_default)

-# Remove devpsace deployment + namespace from the high-side cluster
+# Remove namespace from the high-side cluster
 [group('highside')]
-cleanup-high: (purge-devspace cluster_high ns_default) (delete-ns cluster_high ns_default)
+cleanup-high: (yank-ns _ctx_high _ns_default)
+
+# K9s into the Datasite High cluster
+[group('highside')]
+k9s-high:
+    k9s --context {{ _ctx_high }}

 # ---------------------------------------------------------------------------------------------------------------------

-# Launch a Datasite low-side cluster on http://localhost:{{port_low}}
+# Launch a Datasite low-side cluster on http://localhost:8081 (port_low=8081)
 [group('lowside')]
-start-low: (create-cluster cluster_low port_low)
+start-low: (create-cluster _name_low port_low)

 # Stop the Datasite low-side cluster
 [group('lowside')]
-delete-low: (delete-cluster cluster_low)
+delete-low: (delete-cluster _name_low)

 # Deploy Syft to the low-side cluster
 [group('lowside')]
-deploy-low: (deploy-devspace cluster_low ns_default "-p datasite-low")
+deploy-low: (deploy-devspace _ctx_low _ns_default "-p datasite-low")

 # Reset Syft DB state in the low-side cluster
 [group('lowside')]
-reset-low: (reset-syft cluster_low ns_default)
+reset-low: (reset-syft _ctx_low _ns_default)

-# Remove devpsace deployment + namespace from the low-side cluster
+# Remove namespace from the low-side cluster
 [group('lowside')]
-cleanup-low: (purge-devspace cluster_low ns_default) (delete-ns cluster_low ns_default)
+cleanup-low: (yank-ns _ctx_low _ns_default)
+
+# K9s into the Datasite Low cluster
+[group('lowside')]
+k9s-low:
+    k9s --context {{ _ctx_low }}

 # ---------------------------------------------------------------------------------------------------------------------

-# Launch a Gateway cluster on http://localhost:{{port_gw}}
+# Launch a Gateway cluster on http://localhost:8083 (port_gw=8083)
 [group('gateway')]
-start-gw: (create-cluster cluster_gw port_gw)
+start-gw: (create-cluster _name_gw port_gw)

 # Delete the Gateway cluster
 [group('gateway')]
-delete-gw: (delete-cluster cluster_gw)
+delete-gw: (delete-cluster _name_gw)

 # Deploy Syft to the gateway cluster
 [group('gateway')]
-deploy-gw: (deploy-devspace cluster_gw ns_default "-p gateway")
+deploy-gw: (deploy-devspace _ctx_gw _ns_default "-p gateway")

 # Reset Syft DB state in the gateway cluster
 [group('gateway')]
-reset-gw: (reset-syft cluster_gw ns_default)
+reset-gw: (reset-syft _ctx_gw _ns_default)

-# Remove devpsace deployment + namespace from the gateway cluster
+# Remove namespace from the gateway cluster
 [group('gateway')]
-cleanup-gw: (purge-devspace cluster_gw ns_default) (delete-ns cluster_gw ns_default)
-
-# ---------------------------------------------------------------------------------------------------------------------
+cleanup-gw: (yank-ns _ctx_gw _ns_default)

-# TODO - multi-namespace -> unique k3d ports
-# # Launch a multi-agent cluster on http://localhost:{{port_default}}
-# [group('shared')]
-# start-shared: (create-cluster cluster_default port_default "--agents 2")
-
-# # Stop the multi-agent cluster
-# [group('shared')]
-# delete-shared: (delete-cluster cluster_default)
-
-# [group('shared')]
-# deploy-ns-high: (deploy-devspace cluster_default ns_high)
-
-# [group('shared')]
-# delete-ns-high: (delete-ns cluster_default ns_high)
-
-# [group('shared')]
-# deploy-ns-low: (deploy-devspace cluster_default ns_low "-p datasite-low")
-
-# [group('shared')]
-# delete-ns-low: (delete-ns cluster_default ns_low)
-
-# [group('shared')]
-# deploy-ns-gw: (deploy-devspace cluster_default ns_gw "-p gateway")
-
-# [group('shared')]
-# delete-ns-gw: (delete-ns cluster_default ns_gw)
+# K9s into the Gateway cluster
+[group('gateway')]
+k9s-gw:
+    k9s --context {{ _ctx_gw }}

 # ---------------------------------------------------------------------------------------------------------------------

-# Launch SigNoz on http://localhost:{{port_signoz_ui}}
+# Launch SigNoz. UI=http://localhost:3301 OTEL=http://localhost:4317 (port_signoz_ui=3301 port_signoz_otel=4317)
 [group('signoz')]
-start-signoz: && apply-signoz setup-signoz
-    k3d cluster create signoz \
+start-signoz: && (apply-signoz _ctx_signoz) (setup-signoz _ctx_signoz)
+    k3d cluster create {{ _name_signoz }} \
         --port {{ port_signoz_ui }}:3301@loadbalancer \
         --port {{ port_signoz_otel }}:4317@loadbalancer \
         --k3s-arg "--disable=metrics-server@server:*"
@@ -176,6 +192,11 @@ start-signoz: && apply-signoz setup-signoz
         Dashboard: \033[1;36mhttp://localhost:{{ port_signoz_ui }}\033[0m\n\
         OTEL Endpoint: \033[1;36mhttp://localhost:{{ port_signoz_otel }}\033[0m\n"

+# K9s into the Signoz cluster
+[group('signoz')]
+k9s-signoz:
+    k9s --context {{ _ctx_signoz }}
+
 # Remove SigNoz from the cluster
 [group('signoz')]
 delete-collector:
@@ -183,17 +204,17 @@ delete-collector:

 # Remove SigNoz from the cluster
 [group('signoz')]
-delete-signoz: (delete-cluster cluster_signoz)
+delete-signoz: (delete-cluster _name_signoz)

 [group('signoz')]
 [private]
-apply-collector cluster:
-    @echo "Installing SigNoz OTel Collector"
+apply-collector kube_context:
+    @echo "Installing SigNoz OTel Collector in kubernetes context {{ kube_context }}"
     helm install k8s-infra k8s-infra \
         --repo https://charts.signoz.io \
-        --kube-context {{ cluster }} \
+        --kube-context {{ kube_context }} \
         --set global.deploymentEnvironment=local \
-        --set clusterName={{ cluster }} \
+        --set clusterName={{ kube_context }} \
         --set otelCollectorEndpoint={{ signoz_otel_url }} \
         --set otelInsecure=true \
         --set presets.otlpExporter.enabled=true \
@@ -201,11 +222,11 @@ apply-collector cluster:

 [group('signoz')]
 [private]
-apply-signoz:
-    @echo "Installing SigNoz on the cluster"
+apply-signoz kube_context:
+    @echo "Installing SigNoz in kube context {{ kube_context }}"
     helm install signoz signoz \
         --repo https://charts.signoz.io \
-        --kube-context {{ cluster_signoz }} \
+        --kube-context {{ kube_context }} \
         --namespace platform \
         --create-namespace \
         --version 0.52.0 \
@@ -215,10 +236,10 @@ apply-signoz:

 [group('signoz')]
 [private]
-setup-signoz:
+setup-signoz kube_context:
     @echo "Waiting for SigNoz frontend to be available..."
     @bash ./packages/grid/scripts/wait_for.sh service signoz-frontend \
-        --namespace platform --context {{ cluster_signoz }} &> /dev/null
+        --namespace platform --context {{ kube_context }} &> /dev/null

     @echo "Setting up SigNoz account"
     @curl --retry 5 --retry-all-errors -X POST \
@@ -244,16 +265,10 @@ delete-clusters:

 [group('cluster')]
 [private]
-create-cluster cluster port *args='': start-registry && (apply-coredns cluster) (apply-collector cluster)
-    #!/bin/bash
-    set -euo pipefail
-
-    # remove the k3d- prefix
-    CLUSTER_NAME=$(echo "{{ cluster }}" | sed -e 's/k3d-//g')
-
-    k3d cluster create $CLUSTER_NAME \
+create-cluster cluster_name port *args='': start-registry && (apply-coredns "k3d-" + cluster_name) (apply-collector "k3d-" + cluster_name)
+    k3d cluster create {{ cluster_name }} \
         --port {{ port }}:80@loadbalancer \
-        --registry-use k3d-registry.localhost:5800 {{ args }}
+        --registry-use {{ registry_url }} {{ args }}

 [group('cluster')]
 [private]
@@ -267,22 +282,17 @@ delete-cluster *args='':

 [group('cluster')]
 [private]
-delete-ns context namespace:
-    kubectl delete ns {{ namespace }} --force --grace-period=0 --context {{ context }}
-
-[group('cluster')]
-[private]
-apply-coredns cluster:
+apply-coredns kube_context:
     @echo "Applying custom CoreDNS config"

-    kubectl apply -f ./scripts/k8s-coredns-custom.yml --context {{ cluster }}
-    kubectl delete pod -n kube-system -l k8s-app=kube-dns --context {{ cluster }}
+    kubectl apply -f ./scripts/k8s-coredns-custom.yml --context {{ kube_context }}
+    kubectl delete pod -n kube-system -l k8s-app=kube-dns --context {{ kube_context }}

 # ---------------------------------------------------------------------------------------------------------------------

 [group('devspace')]
 [private]
-deploy-devspace cluster namespace *args='':
+deploy-devspace kube_context namespace *args='':
     #!/bin/bash
     set -euo pipefail

@@ -294,11 +304,11 @@ deploy-devspace cluster namespace *args='':
         PROFILE="-p $PROFILE"
     fi

-    echo "Deploying to {{ cluster }}"
+    echo "Deploying to kube context {{ kube_context }}"

     devspace deploy -b \
         --no-warn \
-        --kube-context {{ cluster }} \
+        --kube-context {{ kube_context }} \
         --namespace {{ namespace }} \
         $PROFILE \
         {{ args }} \
@@ -306,12 +316,12 @@ deploy-devspace cluster namespace *args='':

 [group('devspace')]
 [private]
-purge-devspace cluster namespace:
+purge-devspace kube_context namespace:
     #!/bin/bash
     set -euo pipefail

     cd packages/grid
-    devspace purge --force-purge --kube-context {{ cluster }} --no-warn --namespace {{ namespace }}
+    devspace purge --force-purge --kube-context {{ kube_context }} --no-warn --namespace {{ namespace }}
     sleep 3

 # ---------------------------------------------------------------------------------------------------------------------
@@ -338,13 +348,13 @@ check-platform:

 [group('cloud')]
 [private]
-deploy-cloud cluster_ctx registry_url namespace profile: check-platform
+deploy-cloud kube_context registry_url namespace profile: check-platform
     #!/bin/bash

-    CONTEXT_NAME=$(kubectl config get-contexts -o=name | grep "{{ cluster_ctx }}")
+    CONTEXT_NAME=$(kubectl config get-contexts -o=name | grep "{{ kube_context }}")

     if [ -z "$CONTEXT_NAME" ]; then
-        echo "Context not found: {{ cluster_ctx }}. Authorized with cloud providers to get relevant K8s cluster contexts"
+        echo "Context not found: {{ kube_context }}. Authorized with cloud providers to get relevant K8s cluster contexts"
         exit 1
     fi

@@ -356,13 +366,13 @@ deploy-cloud cluster_ctx registry_url namespace profile: check-platform

 [group('cloud')]
 [private]
-purge-cloud cluster_ctx namespace:
+purge-cloud kube_context namespace:
     #!/bin/bash

-    CONTEXT_NAME=$(kubectl config get-contexts -o=name | grep "{{ cluster_ctx }}")
+    CONTEXT_NAME=$(kubectl config get-contexts -o=name | grep "{{ kube_context }}")

     if [ -z "$CONTEXT_NAME" ]; then
-        echo "Context not found: {{ cluster_ctx }}. Authorized with cloud providers to get relevant K8s cluster contexts"
+        echo "Context not found: {{ kube_context }}. Authorized with cloud providers to get relevant K8s cluster contexts"
         exit 1
     fi

@@ -428,47 +438,39 @@ deploy-az-high aks_cluster az_registry namespace="syft": (deploy-cloud aks_clust

 # Reset Syft state in a cluster
 [group('utils')]
-[private]
-reset-syft name namespace:
-    kubectl config use-context {{ name }}
-    scripts/reset_k8s.sh
+reset-syft kube_context namespace:
+    scripts/reset_k8s.sh --context {{ kube_context }} --namespace {{ namespace }}

-# K9s into the Datasite High cluster
-[group('utils')]
-k9s-high:
-    k9s --context {{ cluster_high }}
-
-# K9s into the Datesite Low cluster
-[group('utils')]
-k9s-low:
-    k9s --context {{ cluster_low }}
-
-# K9s into the Gateway cluster
-[group('utils')]
-k9s-gw:
-    k9s --context {{ cluster_gw }}
-
-# K9s into the Signoz cluster
-[group('utils')]
-k9s-signoz:
-    k9s --context {{ cluster_signoz }}
-
-# Stop all Syft clusters + registry
+# Delete all local clusters and registry
 [group('utils')]
 delete-all: delete-clusters delete-registry
-    @echo "Stopped all Syft components"

-[confirm('Confirm prune all docker resources?')]
+# Prune local docker cache. Run at least once a month.
[group('utils')] prune-docker: -docker container prune -f -docker volume prune -af -docker image prune -af - -docker builder prune -af - -docker buildx prune -af -docker system prune -af --volumes +# Delete all resources in a namespace [group('utils')] -yank-ns namespace: - -kubectl delete ns {{ namespace }} --now --timeout=5s - kubectl get ns {{ namespace }} -o json | jq '.spec.finalizers = []' | kubectl replace --raw /api/v1/namespaces/{{ namespace }}/finalize -f - +yank-ns kube_context namespace: + # delete pods 𝙛 𝙖 𝙨 𝙩 + -kubectl delete statefulsets --all --context {{ kube_context }} --namespace {{ namespace }} --now + -kubectl delete deployments --all --context {{ kube_context }} --namespace {{ namespace }} --now + -kubectl delete pods --all --namespace {{ namespace }} --grace-period=0 --force + + # delete resources 𝙛 𝙖 𝙨 𝙩 + -kubectl delete configmap --all --context {{ kube_context }} --namespace {{ namespace }} --now + -kubectl delete secrets --all --context {{ kube_context }} --namespace {{ namespace }} --now + -kubectl delete ingress --all --context {{ kube_context }} --namespace {{ namespace }} --now + + # delete namespace NOT 𝙛 𝙖 𝙨 𝙩 :( + -kubectl delete ns {{ namespace }} --context {{ kube_context }} --grace-period=0 --force --timeout=5s + + # Too slow... yanking it + -kubectl get ns {{ namespace }} --context {{ kube_context }} -o json | jq '.spec.finalizers = []' | \ + kubectl replace --context {{ kube_context }} --raw /api/v1/namespaces/{{ namespace }}/finalize -f - + + @echo "Done" diff --git a/scripts/reset_k8s.sh b/scripts/reset_k8s.sh index 033cb24ed31..68c317a6232 100755 --- a/scripts/reset_k8s.sh +++ b/scripts/reset_k8s.sh @@ -1,12 +1,13 @@ #!/bin/bash -echo $1 +KUBECTL_ARGS="$@" +NAMESPACE="syft" +POSTGRES_POD_NAME="postgres-0" -# Default pod name -DEFAULT_POD_NAME="postgres-0" - -# Use the provided pod name or the default -POSTGRES_POD_NAME=${1:-$DEFAULT_POD_NAME} +# if kubectl args doesn't have a namespace, add it +if [[ ! 
"$KUBECTL_ARGS" =~ (-n|--namespace) ]]; then + KUBECTL_ARGS="$KUBECTL_ARGS --namespace $NAMESPACE" +fi # SQL commands to reset all tables RESET_COMMAND=" @@ -38,32 +39,31 @@ END \$\$; " # Execute the SQL commands -echo "Resetting all tables in $POSTGRES_POD_NAME..." -kubectl exec -i -n syft $POSTGRES_POD_NAME -- psql -U syft_postgres -d syftdb_postgres << EOF +echo ">>> Resetting database '$POSTGRES_POD_NAME'. psql output:" +kubectl exec $KUBECTL_ARGS -i $POSTGRES_POD_NAME -- psql -U syft_postgres -d syftdb_postgres << EOF $RESET_COMMAND EOF -echo "All tables in $POSTGRES_POD_NAME have been reset." - -# Resetting the backend pod -BACKEND_POD=$(kubectl get pods -n syft -o jsonpath="{.items[*].metadata.name}" | tr ' ' '\n' | grep -E ".*backend.*") -if [ -n "$BACKEND_POD" ]; then - kubectl delete pod -n syft $BACKEND_POD - echo "Backend pod $BACKEND_POD has been deleted and will be restarted." -else - echo "No backend pod found." -fi - # Deleting StatefulSets that end with -pool -POOL_STATEFULSETS=$(kubectl get statefulsets -n syft -o jsonpath="{.items[*].metadata.name}" | tr ' ' '\n' | grep -E ".*-pool$") +POOL_STATEFULSETS=$(kubectl get statefulsets $KUBECTL_ARGS -o jsonpath="{.items[*].metadata.name}" | tr ' ' '\n' | grep -E ".*-pool$") if [ -n "$POOL_STATEFULSETS" ]; then + echo ">>> Deleting '$POOL_STATEFULSETS'" for STATEFULSET in $POOL_STATEFULSETS; do - kubectl delete statefulset -n syft $STATEFULSET - echo "StatefulSet $STATEFULSET has been deleted." + kubectl delete statefulsets $KUBECTL_ARGS $STATEFULSET + kubectl delete pods $KUBECTL_ARGS -l "app.kubernetes.io/component=$STATEFULSET" --grace-period=0 --force done -else - echo "No StatefulSets ending with '-pool' found." 
fi -# wait for backend to come back up -bash packages/grid/scripts/wait_for.sh service backend --namespace syft +# Resetting the backend pod +BACKEND_POD=$(kubectl get pods $KUBECTL_ARGS -o jsonpath="{.items[*].metadata.name}" | tr ' ' '\n' | grep -E ".*backend.*") +if [ -n "$BACKEND_POD" ]; then + echo ">>> Re-creating '$BACKEND_POD'" + kubectl delete pod $KUBECTL_ARGS $BACKEND_POD --grace-period=0 --force + + # wait for backend to come back up + echo ">>> Waiting for '$BACKEND_POD' to be ready..." + export WAIT_TIME=5 + bash packages/grid/scripts/wait_for.sh service backend $KUBECTL_ARGS > /dev/null +fi + +echo ">>> Done"