name: Kubeadm Reset run-name: ${{ gitea.actor }} requested kubeadm reset on: workflow_dispatch: inputs: confirm: description: "Type RESET to run kubeadm reset on all nodes" required: true type: string concurrency: group: kubeadm-bootstrap cancel-in-progress: false jobs: reset: name: "Reset Cluster Nodes" runs-on: ubuntu-latest steps: - name: Validate confirmation phrase run: | if [ "${{ inputs.confirm }}" != "RESET" ]; then echo "Confirmation failed. You must type RESET." exit 1 fi - name: Checkout repository uses: https://gitea.com/actions/checkout@v4 - name: Create SSH key run: | install -m 0700 -d ~/.ssh KEY_SOURCE="" KEY_CONTENT="" KEY_B64="$(printf '%s' "${{ secrets.SSH_KEY_PRIVATE_BASE64 }}")" if [ -n "$KEY_B64" ]; then KEY_SOURCE="SSH_KEY_PRIVATE_BASE64" KEY_CONTENT="$(printf '%s' "$KEY_B64" | base64 -d)" else KEY_CONTENT="$(printf '%s' "${{ secrets.SSH_KEY_PRIVATE }}")" if [ -n "$KEY_CONTENT" ]; then KEY_SOURCE="SSH_KEY_PRIVATE" else KEY_CONTENT="$(printf '%s' "${{ secrets.KUBEADM_SSH_PRIVATE_KEY }}")" KEY_SOURCE="KUBEADM_SSH_PRIVATE_KEY" fi fi if [ -z "$KEY_CONTENT" ]; then echo "Missing SSH private key secret. Set SSH_KEY_PRIVATE_BASE64, SSH_KEY_PRIVATE, or KUBEADM_SSH_PRIVATE_KEY." exit 1 fi KEY_CONTENT="$(printf '%s' "$KEY_CONTENT" | tr -d '\r')" if printf '%s' "$KEY_CONTENT" | grep -q '\\n'; then printf '%b' "$KEY_CONTENT" > ~/.ssh/id_ed25519 else printf '%s\n' "$KEY_CONTENT" > ~/.ssh/id_ed25519 fi chmod 0600 ~/.ssh/id_ed25519 if ! ssh-keygen -y -f ~/.ssh/id_ed25519 >/dev/null 2>&1; then echo "Invalid private key content from $KEY_SOURCE" exit 1 fi - name: Set up Terraform uses: hashicorp/setup-terraform@v2 with: terraform_version: 1.6.6 terraform_wrapper: false - name: Build Terraform backend files working-directory: terraform run: | cat > secrets.auto.tfvars << EOF pm_api_token_secret = "${{ secrets.PM_API_TOKEN_SECRET }}" SSH_KEY_PUBLIC = "$(printf '%s' "${{ secrets.SSH_KEY_PUBLIC }}" | tr -d '\r\n')" EOF cat > backend.hcl << EOF bucket = "${{ secrets.B2_TF_BUCKET }}" key = "terraform.tfstate" region = "us-east-005" endpoints = { s3 = "${{ secrets.B2_TF_ENDPOINT }}" } access_key = "$(printf '%s' "${{ secrets.B2_KEY_ID }}" | tr -d '\r\n')" secret_key = "$(printf '%s' "${{ secrets.B2_APPLICATION_KEY }}" | tr -d '\r\n')" skip_credentials_validation = true skip_metadata_api_check = true skip_region_validation = true skip_requesting_account_id = true use_path_style = true EOF - name: Terraform init for state read working-directory: terraform run: terraform init -reconfigure -backend-config=backend.hcl - name: Create kubeadm inventory env: KUBEADM_SSH_USER: ${{ secrets.KUBEADM_SSH_USER }} KUBEADM_SUBNET_PREFIX: ${{ secrets.KUBEADM_SUBNET_PREFIX }} run: | set -euo pipefail TF_OUTPUT_JSON="" for attempt in 1 2 3 4 5 6; do echo "Inventory render attempt $attempt/6" TF_OUTPUT_JSON="$(terraform -chdir=terraform output -json)" if printf '%s' "$TF_OUTPUT_JSON" | ./nixos/kubeadm/scripts/render-inventory-from-tf-output.py > nixos/kubeadm/scripts/inventory.env; then exit 0 fi if [ "$attempt" -lt 6 ]; then echo "VM IPv4s not available yet; waiting 30s before retry" sleep 30 fi done echo "Falling back to SSH-based inventory discovery" printf '%s' "$TF_OUTPUT_JSON" | ./nixos/kubeadm/scripts/discover-inventory-from-ssh.py > nixos/kubeadm/scripts/inventory.env - name: Run cluster reset run: | ./nixos/kubeadm/scripts/reset-cluster-nodes.sh