From 789a6d15a691abaefe2720f2ff6639da887eb746 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 28 Feb 2026 05:53:34 +0000
Subject: [PATCH 1/6] Initial plan


From 5dd892a8fcf9707bc2ce3d071cbc85e0ae430df3 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 28 Feb 2026 06:03:51 +0000
Subject: [PATCH 2/6] Add E2E test cases for apply -f usage with kubeadm join
 flow

Co-authored-by: bcho <1975118+bcho@users.noreply.github.com>
---
 hack/e2e/README.md        |  39 ++++--
 hack/e2e/infra/main.bicep |  88 +++++++++++++-
 hack/e2e/lib/cleanup.sh   |  24 ++--
 hack/e2e/lib/infra.sh     |  20 ++-
 hack/e2e/lib/node-join.sh | 247 ++++++++++++++++++++++++++++++++++++--
 hack/e2e/lib/validate.sh  |  18 +--
 hack/e2e/run.sh           |  30 +++--
 7 files changed, 410 insertions(+), 56 deletions(-)

diff --git a/hack/e2e/README.md b/hack/e2e/README.md
index 2f1e418..7582b10 100644
--- a/hack/e2e/README.md
+++ b/hack/e2e/README.md
@@ -1,7 +1,8 @@
 # AKS Flex Node E2E Tests
 
-End-to-end tests that provision an AKS cluster and two Ubuntu VMs in Azure, join
-them as flex nodes (one via MSI, one via bootstrap token), and run smoke tests.
+End-to-end tests that provision an AKS cluster and three Ubuntu VMs in Azure,
+join them as flex nodes (one via MSI, one via bootstrap token, one via kubeadm
+join using `apply -f`), and run smoke tests.
 
 ## Prerequisites
 
@@ -27,8 +28,8 @@ export E2E_LOCATION=westus2
 make e2e
 ```
 
-This will build the agent binary, deploy infrastructure via Bicep, join both
-nodes, run validations, collect logs, and tear everything down.
+This will build the agent binary, deploy infrastructure via Bicep, join all
+three nodes, run validations, collect logs, and tear everything down.
 
 ## Commands
 
@@ -38,10 +39,11 @@ omitted it defaults to `all`.
 | Command | Description |
 |---------|-------------|
 | `all` | Full flow: build, infra, join, validate, cleanup (default) |
-| `infra` | Deploy AKS cluster + 2 VMs via Bicep |
-| `join` | Join both nodes to the cluster |
+| `infra` | Deploy AKS cluster + 3 VMs via Bicep |
+| `join` | Join all nodes to the cluster |
 | `join-msi` | Join only the MSI-authenticated node |
 | `join-token` | Join only the bootstrap-token node |
+| `join-kubeadm` | Join only the kubeadm node (`apply -f` with `KubeadmNodeJoin`) |
 | `validate` | Verify nodes joined and run smoke tests |
 | `smoke` | Run smoke tests only (nginx pods on flex nodes) |
 | `logs` | Collect logs from VMs |
@@ -72,6 +74,21 @@ Additional environment variables:
 | `AZURE_SUBSCRIPTION_ID` | (auto-detected) | Azure subscription |
 | `AZURE_TENANT_ID` | (auto-detected) | Azure tenant |
 
+## Node Join Modes
+
+The E2E suite tests three node join methods:
+
+| VM | Auth Mode | Join Method |
+|----|-----------|-------------|
+| `vm-e2e-msi-*` | Managed Identity (MSI) | `aks-flex-node agent --config config.json` |
+| `vm-e2e-token-*` | Bootstrap Token | `aks-flex-node agent --config config.json` |
+| `vm-e2e-kubeadm-*` | Bootstrap Token | `aks-flex-node apply -f kubeadm-join.json` |
+
+The kubeadm VM uses the `apply -f` command with a JSON action file that
+contains a sequence of component actions (configure OS, download CRI/kube/CNI
+binaries, configure CNI, start containerd, then `KubeadmNodeJoin`) to join the
+cluster using the kubeadm join flow.
+
 ## Iterative Development
 
 The subcommands make it easy to deploy infrastructure once and iterate on the
@@ -84,6 +101,7 @@ join or validation steps without re-provisioning every time.
 # Iterate on the join logic
 ./hack/e2e/run.sh join-msi
 ./hack/e2e/run.sh join-token
+./hack/e2e/run.sh join-kubeadm
 
 # Run validation
 ./hack/e2e/run.sh validate
@@ -114,11 +132,11 @@ make e2e-cleanup  # Tear down resources
 hack/e2e/
   run.sh              Main entry point / orchestrator
   infra/
-    main.bicep        Bicep template (AKS + VNet + NSG + 2 VMs + role assignments)
+    main.bicep        Bicep template (AKS + VNet + NSG + 3 VMs + role assignments)
   lib/
     common.sh         Logging, prereqs, config, state management, SSH helpers
     infra.sh          Bicep deployment, output extraction, kubeconfig fetch
-    node-join.sh      MSI and token node join logic
+    node-join.sh      MSI, token, and kubeadm node join logic
     validate.sh       Node-ready checks and smoke tests (nginx pods)
     cleanup.sh        Log collection and Azure resource teardown
 ```
@@ -135,7 +153,10 @@ previous one left off. Use `run.sh status` to inspect it.
   your SSH key is available (defaults to `~/.ssh/id_rsa.pub`). Check the state
   file for the correct VM public IPs with `run.sh status`.
 - **Node not joining**: Run `run.sh logs` to pull `journalctl` and agent logs
-  from both VMs. Logs are saved to `$E2E_WORK_DIR/logs/`.
+  from all VMs. Logs are saved to `$E2E_WORK_DIR/logs/`.
+- **Kubeadm join failures**: Check `kubeadm-agent-journal.log` and
+  `kubeadm-kubelet.log` in the logs directory. The `apply -f` approach runs
+  sequentially; each action step must succeed before the next one starts.
 - **Timeouts**: Adjust `E2E_SSH_WAIT_TIMEOUT`, `E2E_NODE_JOIN_TIMEOUT`, or
   `E2E_POD_READY_TIMEOUT` environment variables (in seconds).
 - **Leftover resources**: If a previous run didn't clean up, run
diff --git a/hack/e2e/infra/main.bicep b/hack/e2e/infra/main.bicep
index 06da42c..0073957 100644
--- a/hack/e2e/infra/main.bicep
+++ b/hack/e2e/infra/main.bicep
@@ -34,11 +34,12 @@ param tags object = {}
 // ---------------------------------------------------------------------------
 // Variables
 // ---------------------------------------------------------------------------
-var clusterName = 'aks-e2e-${nameSuffix}'
-var msiVmName   = 'vm-e2e-msi-${nameSuffix}'
-var tokenVmName = 'vm-e2e-token-${nameSuffix}'
-var vnetName    = 'vnet-e2e-${nameSuffix}'
-var nsgName     = 'nsg-e2e-${nameSuffix}'
+var clusterName   = 'aks-e2e-${nameSuffix}'
+var msiVmName     = 'vm-e2e-msi-${nameSuffix}'
+var tokenVmName   = 'vm-e2e-token-${nameSuffix}'
+var kubeadmVmName = 'vm-e2e-kubeadm-${nameSuffix}'
+var vnetName      = 'vnet-e2e-${nameSuffix}'
+var nsgName       = 'nsg-e2e-${nameSuffix}'
 
 var subnetAksName = 'snet-aks'
 var subnetVmName  = 'snet-vm'
@@ -158,6 +159,16 @@ resource pipToken 'Microsoft.Network/publicIPAddresses@2023-11-01' = {
   }
 }
 
+resource pipKubeadm 'Microsoft.Network/publicIPAddresses@2023-11-01' = {
+  name: '${kubeadmVmName}-pip'
+  location: location
+  tags: tags
+  sku: { name: 'Standard' }
+  properties: {
+    publicIPAllocationMethod: 'Static'
+  }
+}
+
 // ---------------------------------------------------------------------------
 // NICs
 // ---------------------------------------------------------------------------
@@ -205,6 +216,28 @@ resource nicToken 'Microsoft.Network/networkInterfaces@2023-11-01' = {
   }
 }
 
+resource nicKubeadm 'Microsoft.Network/networkInterfaces@2023-11-01' = {
+  name: '${kubeadmVmName}-nic'
+  location: location
+  tags: tags
+  properties: {
+    ipConfigurations: [
+      {
+        name: 'ipconfig1'
+        properties: {
+          subnet: {
+            id: vnet.properties.subnets[1].id
+          }
+          publicIPAddress: {
+            id: pipKubeadm.id
+          }
+          privateIPAllocationMethod: 'Dynamic'
+        }
+      }
+    ]
+  }
+}
+
 // ---------------------------------------------------------------------------
 // VM: MSI (system-assigned managed identity)
 // ---------------------------------------------------------------------------
@@ -292,6 +325,48 @@ resource vmToken 'Microsoft.Compute/virtualMachines@2024-03-01' = {
   }
 }
 
+// ---------------------------------------------------------------------------
+// VM: Kubeadm (no managed identity - uses apply -f with kubeadm join flow)
+// ---------------------------------------------------------------------------
+resource vmKubeadm 'Microsoft.Compute/virtualMachines@2024-03-01' = {
+  name: kubeadmVmName
+  location: location
+  tags: tags
+  properties: {
+    hardwareProfile: { vmSize: vmSize }
+    osProfile: {
+      computerName: kubeadmVmName
+      adminUsername: adminUsername
+      linuxConfiguration: {
+        disablePasswordAuthentication: true
+        ssh: {
+          publicKeys: [
+            {
+              path: '/home/${adminUsername}/.ssh/authorized_keys'
+              keyData: sshPublicKey
+            }
+          ]
+        }
+      }
+    }
+    storageProfile: {
+      imageReference: {
+        publisher: 'Canonical'
+        offer: '0001-com-ubuntu-server-jammy'
+        sku: '22_04-lts-gen2'
+        version: 'latest'
+      }
+      osDisk: {
+        createOption: 'FromImage'
+        managedDisk: { storageAccountType: 'StandardSSD_LRS' }
+      }
+    }
+    networkProfile: {
+      networkInterfaces: [ { id: nicKubeadm.id } ]
+    }
+  }
+}
+
 // ---------------------------------------------------------------------------
 // Role assignments: grant MSI VM permissions on the AKS cluster
 // ---------------------------------------------------------------------------
@@ -331,4 +406,7 @@ output msiVmPrincipalId string = vmMsi.identity.principalId
 output tokenVmName string = vmToken.name
 output tokenVmIp string = pipToken.properties.ipAddress
 
+output kubeadmVmName string = vmKubeadm.name
+output kubeadmVmIp string = pipKubeadm.properties.ipAddress
+
 output adminUsername string = adminUsername
diff --git a/hack/e2e/lib/cleanup.sh b/hack/e2e/lib/cleanup.sh
index 2ed7676..16ecb3a 100755
--- a/hack/e2e/lib/cleanup.sh
+++ b/hack/e2e/lib/cleanup.sh
@@ -43,16 +43,17 @@ _collect_vm_logs() {
 }
 
 # ---------------------------------------------------------------------------
-# collect_logs - Collect logs from both VMs
+# collect_logs - Collect logs from all VMs
 # ---------------------------------------------------------------------------
 collect_logs() {
   log_section "Collecting Logs"
 
   mkdir -p "${E2E_LOG_DIR}"
 
-  local msi_vm_ip token_vm_ip
+  local msi_vm_ip token_vm_ip kubeadm_vm_ip
   msi_vm_ip="$(state_get msi_vm_ip)"
   token_vm_ip="$(state_get token_vm_ip)"
+  kubeadm_vm_ip="$(state_get kubeadm_vm_ip)"
 
   if [[ -n "${msi_vm_ip}" ]]; then
     _collect_vm_logs "${msi_vm_ip}" "msi" || true
@@ -62,6 +63,10 @@ collect_logs() {
     _collect_vm_logs "${token_vm_ip}" "token" || true
   fi
 
+  if [[ -n "${kubeadm_vm_ip}" ]]; then
+    _collect_vm_logs "${kubeadm_vm_ip}" "kubeadm" || true
+  fi
+
   # Also capture cluster-side info
   {
     echo "=== Nodes ==="
@@ -91,11 +96,12 @@ cleanup() {
     return 0
   fi
 
-  local resource_group cluster_name msi_vm_name token_vm_name
+  local resource_group cluster_name msi_vm_name token_vm_name kubeadm_vm_name
   resource_group="$(state_get resource_group)"
   cluster_name="$(state_get cluster_name)"
   msi_vm_name="$(state_get msi_vm_name)"
   token_vm_name="$(state_get token_vm_name)"
+  kubeadm_vm_name="$(state_get kubeadm_vm_name)"
   local deployment_name
   deployment_name="$(state_get deployment_name)"
 
@@ -105,16 +111,20 @@ cleanup() {
   fi
 
   # Delete VMs first (faster than waiting for full RG delete)
-  log_info "[1/4] Deleting MSI VM: ${msi_vm_name}..."
+  log_info "[1/5] Deleting MSI VM: ${msi_vm_name}..."
   az vm delete --resource-group "${resource_group}" --name "${msi_vm_name}" \
     --force-deletion yes --yes --no-wait 2>/dev/null || true
 
-  log_info "[2/4] Deleting Token VM: ${token_vm_name}..."
+  log_info "[2/5] Deleting Token VM: ${token_vm_name}..."
   az vm delete --resource-group "${resource_group}" --name "${token_vm_name}" \
     --force-deletion yes --yes --no-wait 2>/dev/null || true
 
+  log_info "[3/5] Deleting Kubeadm VM: ${kubeadm_vm_name}..."
+  az vm delete --resource-group "${resource_group}" --name "${kubeadm_vm_name}" \
+    --force-deletion yes --yes --no-wait 2>/dev/null || true
+
   # Clean up leftover networking resources tied to our deployment
-  log_info "[3/4] Cleaning up networking resources..."
+  log_info "[4/5] Cleaning up networking resources..."
   local run_id="${GITHUB_RUN_ID:-}"
   if [[ -n "${run_id}" ]]; then
     for res_type in networkInterfaces publicIPAddresses networkSecurityGroups disks; do
@@ -126,7 +136,7 @@ cleanup() {
     done
   fi
 
-  log_info "[4/4] Deleting AKS cluster: ${cluster_name}..."
+  log_info "[5/5] Deleting AKS cluster: ${cluster_name}..."
   az aks delete --resource-group "${resource_group}" --name "${cluster_name}" \
     --yes --no-wait 2>/dev/null || true
 
diff --git a/hack/e2e/lib/infra.sh b/hack/e2e/lib/infra.sh
index 1ba134d..b30a7d6 100755
--- a/hack/e2e/lib/infra.sh
+++ b/hack/e2e/lib/infra.sh
@@ -105,7 +105,7 @@ infra_deploy() {
     -o json)
 
   local cluster_name cluster_id msi_vm_name msi_vm_ip msi_vm_principal_id
-  local token_vm_name token_vm_ip admin_username
+  local token_vm_name token_vm_ip kubeadm_vm_name kubeadm_vm_ip admin_username
 
   cluster_name=$(echo "${outputs}"    | jq -r '.clusterName.value')
   cluster_id=$(echo "${outputs}"      | jq -r '.clusterId.value')
@@ -114,6 +114,8 @@ infra_deploy() {
   msi_vm_principal_id=$(echo "${outputs}" | jq -r '.msiVmPrincipalId.value')
   token_vm_name=$(echo "${outputs}"   | jq -r '.tokenVmName.value')
   token_vm_ip=$(echo "${outputs}"     | jq -r '.tokenVmIp.value')
+  kubeadm_vm_name=$(echo "${outputs}" | jq -r '.kubeadmVmName.value')
+  kubeadm_vm_ip=$(echo "${outputs}"   | jq -r '.kubeadmVmIp.value')
   admin_username=$(echo "${outputs}"  | jq -r '.adminUsername.value')
 
   # Persist to state
@@ -124,6 +126,8 @@ infra_deploy() {
   state_set "msi_vm_principal_id"  "${msi_vm_principal_id}"
   state_set "token_vm_name"        "${token_vm_name}"
   state_set "token_vm_ip"          "${token_vm_ip}"
+  state_set "kubeadm_vm_name"      "${kubeadm_vm_name}"
+  state_set "kubeadm_vm_ip"        "${kubeadm_vm_ip}"
   state_set "admin_username"       "${admin_username}"
   state_set "resource_group"       "${E2E_RESOURCE_GROUP}"
   state_set "location"             "${E2E_LOCATION}"
@@ -131,23 +135,27 @@ infra_deploy() {
   state_set "tenant_id"            "${AZURE_TENANT_ID}"
   state_set "deployment_name"      "${deployment_name}"
 
-  log_info "Cluster:   ${cluster_name} (${cluster_id})"
-  log_info "MSI VM:    ${msi_vm_name} @ ${msi_vm_ip}"
-  log_info "Token VM:  ${token_vm_name} @ ${token_vm_ip}"
+  log_info "Cluster:     ${cluster_name} (${cluster_id})"
+  log_info "MSI VM:      ${msi_vm_name} @ ${msi_vm_ip}"
+  log_info "Token VM:    ${token_vm_name} @ ${token_vm_ip}"
+  log_info "Kubeadm VM:  ${kubeadm_vm_name} @ ${kubeadm_vm_ip}"
 
   # Get kubeconfig and extract cluster info
   infra_get_kubeconfig
 
-  # Wait for SSH on both VMs (in parallel)
-  log_info "Waiting for SSH on both VMs..."
+  # Wait for SSH on all VMs (in parallel)
+  log_info "Waiting for SSH on all VMs..."
   wait_for_ssh "${msi_vm_ip}" &
   local pid_msi=$!
   wait_for_ssh "${token_vm_ip}" &
   local pid_token=$!
+  wait_for_ssh "${kubeadm_vm_ip}" &
+  local pid_kubeadm=$!
 
   local ssh_failed=0
   wait "${pid_msi}" || ssh_failed=1
   wait "${pid_token}" || ssh_failed=1
+  wait "${pid_kubeadm}" || ssh_failed=1
 
   if [[ "${ssh_failed}" -eq 1 ]]; then
     log_error "One or more VMs not reachable via SSH"
diff --git a/hack/e2e/lib/node-join.sh b/hack/e2e/lib/node-join.sh
index f56ace3..3b1eb06 100755
--- a/hack/e2e/lib/node-join.sh
+++ b/hack/e2e/lib/node-join.sh
@@ -3,13 +3,15 @@
 # hack/e2e/lib/node-join.sh - Bootstrap flex nodes into the AKS cluster
 #
 # Functions:
-#   node_join_msi   - Install Azure CLI + MSI auth, deploy binary, run agent
-#   node_join_token - Create bootstrap token/RBAC, deploy binary, run agent
-#   node_join_all   - Join both nodes (MSI first, then token)
+#   node_join_msi      - Install Azure CLI + MSI auth, deploy binary, run agent
+#   node_join_token    - Create bootstrap token/RBAC, deploy binary, run agent
+#   node_join_kubeadm  - Create bootstrap token, deploy binary, run apply -f
+#                        with a KubeadmNodeJoin action (kubeadm join flow)
+#   node_join_all      - Join all nodes (MSI, token, and kubeadm) in parallel
 #
 # Each function:
-#   1. Generates the appropriate config.json
-#   2. SCPs the binary + config onto the VM
+#   1. Generates the appropriate config / action file
+#   2. SCPs the binary + config/action file onto the VM
 #   3. Starts the agent via systemd-run
 #   4. Waits for kubelet to report running
 # =============================================================================
@@ -309,15 +311,231 @@ EOF
 }
 
 # ---------------------------------------------------------------------------
-# node_join_all - Join both nodes in parallel
+# node_join_kubeadm - Join the Kubeadm VM using apply -f with KubeadmNodeJoin
+# ---------------------------------------------------------------------------
+node_join_kubeadm() {
+  log_section "Joining Kubeadm Node (apply -f)"
+  local start
+  start=$(timer_start)
+
+  local vm_ip
+  vm_ip="$(state_get kubeadm_vm_ip)"
+  local server_url
+  server_url="$(state_get server_url)"
+  local ca_cert_data
+  ca_cert_data="$(state_get ca_cert_data)"
+
+  # Step 1: Create bootstrap token & RBAC in the cluster
+  log_info "Creating bootstrap token and RBAC resources for kubeadm join..."
+  local token_id token_secret bootstrap_token expiration
+
+  token_id="$(openssl rand -hex 3)"
+  token_secret="$(openssl rand -hex 8)"
+  bootstrap_token="${token_id}.${token_secret}"
+
+  # Use a portable date command for expiration (24h from now)
+  if date --version &>/dev/null; then
+    # GNU date
+    expiration="$(date -u -d "+24 hours" +"%Y-%m-%dT%H:%M:%SZ")"
+  else
+    # BSD/macOS date
+    expiration="$(date -u -v+24H +"%Y-%m-%dT%H:%M:%SZ")"
+  fi
+
+  log_info "Token ID: ${token_id} | Expires: ${expiration}"
+
+  # Create the bootstrap token secret
+  kubectl apply -f - <<EOF
+apiVersion: v1
+kind: Secret
+metadata:
+  name: bootstrap-token-${token_id}
+  namespace: kube-system
+type: bootstrap.kubernetes.io/token
+stringData:
+  description: "AKS Flex Node E2E kubeadm bootstrap token"
+  token-id: "${token_id}"
+  token-secret: "${token_secret}"
+  expiration: "${expiration}"
+  usage-bootstrap-authentication: "true"
+  usage-bootstrap-signing: "true"
+  auth-extra-groups: "system:bootstrappers:aks-flex-node"
+EOF
+
+  # Create RBAC bindings for TLS bootstrapping (idempotent)
+  kubectl apply -f - <<EOF
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-bootstrapper
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:node-bootstrapper
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-auto-approve-csr
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:certificates.k8s.io:certificatesigningrequests:nodeclient
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-role
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:node
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+EOF
+
+  log_success "Bootstrap token and RBAC configured"
+  state_set "kubeadm_bootstrap_token" "${bootstrap_token}"
+
+  # Step 2: Generate the apply -f action file (JSON array of all bootstrap steps
+  #         ending with the KubeadmNodeJoin action)
+  local action_file="${E2E_WORK_DIR}/kubeadm-join.json"
+  cat > "${action_file}" <<EOF
+[
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.linux.ConfigureBaseOS",
+      "name": "configure-os"
+    },
+    "spec": {}
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.cri.DownloadCRIBinaries",
+      "name": "download-cri-binaries"
+    },
+    "spec": {
+      "containerdVersion": "${E2E_CONTAINERD_VERSION}",
+      "runcVersion": "${E2E_RUNC_VERSION}"
+    }
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.kubebins.DownloadKubeBinaries",
+      "name": "download-kube-binaries"
+    },
+    "spec": {
+      "kubernetesVersion": "${E2E_KUBERNETES_VERSION}"
+    }
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.cni.DownloadCNIBinaries",
+      "name": "download-cni-binaries"
+    },
+    "spec": {}
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.cni.ConfigureCNI",
+      "name": "configure-cni"
+    },
+    "spec": {}
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.cri.StartContainerdService",
+      "name": "start-containerd"
+    },
+    "spec": {}
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.kubeadm.KubeadmNodeJoin",
+      "name": "kubeadm-node-join"
+    },
+    "spec": {
+      "controlPlane": {
+        "server": "${server_url}",
+        "certificateAuthorityData": "${ca_cert_data}"
+      },
+      "kubelet": {
+        "bootstrapAuthInfo": {
+          "token": "${bootstrap_token}"
+        }
+      }
+    }
+  }
+]
+EOF
+
+  # Step 3: Upload binary and action file, then run apply -f via systemd
+  local unit_name="aks-flex-node-kubeadm"
+
+  log_info "Uploading binary and action file to ${vm_ip}..."
+  remote_copy "${E2E_BINARY}" "${vm_ip}" "/tmp/aks-flex-node-binary"
+  remote_copy "${action_file}" "${vm_ip}" "/tmp/kubeadm-join.json"
+
+  log_info "Starting kubeadm join via apply -f on ${vm_ip}..."
+  remote_exec "${vm_ip}" 'bash -s' <<REMOTE
+set -euo pipefail
+
+sudo cp /tmp/aks-flex-node-binary /usr/local/bin/aks-flex-node
+sudo chmod +x /usr/local/bin/aks-flex-node
+aks-flex-node version
+
+sudo mkdir -p /etc/aks-flex-node /var/log/aks-flex-node
+sudo cp /tmp/kubeadm-join.json /etc/aks-flex-node/
+
+sudo systemd-run \
+  --unit=${unit_name} \
+  --description="AKS Flex Node E2E kubeadm join (${unit_name})" \
+  --remain-after-exit \
+  /usr/local/bin/aks-flex-node apply --no-prettyui -f /etc/aks-flex-node/kubeadm-join.json
+
+echo "Waiting ${E2E_BOOTSTRAP_SETTLE_TIME}s for bootstrap to complete..."
+sleep ${E2E_BOOTSTRAP_SETTLE_TIME}
+
+if systemctl is-active --quiet ${unit_name}; then
+  echo "Apply service is running"
+else
+  echo "Apply service failed:"
+  sudo journalctl -u ${unit_name} -n 50 --no-pager || true
+  exit 1
+fi
+
+sleep 10
+if systemctl is-active --quiet kubelet; then
+  echo "kubelet is running"
+else
+  echo "kubelet status:"
+  systemctl status kubelet --no-pager -l 2>&1 || true
+fi
+REMOTE
+
+  log_success "Kubeadm node joined via apply -f in $(timer_elapsed "${start}")s"
+}
+
+# ---------------------------------------------------------------------------
+# node_join_all - Join all nodes in parallel
 # ---------------------------------------------------------------------------
 node_join_all() {
-  log_section "Joining Both Nodes (parallel)"
+  log_section "Joining All Nodes (parallel)"
   local start
   start=$(timer_start)
 
-  local msi_pid token_pid
-  local msi_exit=0 token_exit=0
+  local msi_pid token_pid kubeadm_pid
+  local msi_exit=0 token_exit=0 kubeadm_exit=0
 
   node_join_msi &
   msi_pid=$!
@@ -325,8 +543,12 @@ node_join_all() {
   node_join_token &
   token_pid=$!
 
+  node_join_kubeadm &
+  kubeadm_pid=$!
+
   wait "${msi_pid}" || msi_exit=$?
   wait "${token_pid}" || token_exit=$?
+  wait "${kubeadm_pid}" || kubeadm_exit=$?
 
   local duration
   duration=$(timer_elapsed "${start}")
@@ -337,11 +559,14 @@ node_join_all() {
   if [[ "${token_exit}" -ne 0 ]]; then
     log_error "Token node join failed (exit ${token_exit})"
   fi
+  if [[ "${kubeadm_exit}" -ne 0 ]]; then
+    log_error "Kubeadm node join failed (exit ${kubeadm_exit})"
+  fi
 
-  if [[ "${msi_exit}" -ne 0 || "${token_exit}" -ne 0 ]]; then
+  if [[ "${msi_exit}" -ne 0 || "${token_exit}" -ne 0 || "${kubeadm_exit}" -ne 0 ]]; then
     log_error "Node joins failed (${duration}s)"
     return 1
   fi
 
-  log_success "Both nodes joined in ${duration}s"
+  log_success "All nodes joined in ${duration}s"
 }
diff --git a/hack/e2e/lib/validate.sh b/hack/e2e/lib/validate.sh
index 5ee92b8..f40ff1b 100755
--- a/hack/e2e/lib/validate.sh
+++ b/hack/e2e/lib/validate.sh
@@ -4,9 +4,9 @@
 #
 # Functions:
 #   validate_node_joined  <vm_name>  - Wait for a specific node to appear in kubectl
-#   validate_all_nodes                - Verify both MSI and token nodes joined
+#   validate_all_nodes                - Verify MSI, token, and kubeadm nodes joined
 #   smoke_test            <vm_name> <label>  - Schedule an nginx pod on a node
-#   smoke_test_all                    - Run smoke tests on both nodes
+#   smoke_test_all                    - Run smoke tests on all nodes
 # =============================================================================
 set -euo pipefail
 
@@ -47,7 +47,7 @@ validate_node_joined() {
 }
 
 # ---------------------------------------------------------------------------
-# validate_all_nodes - Check both MSI and token VMs joined
+# validate_all_nodes - Check that the MSI, token, and kubeadm VMs all joined
 # ---------------------------------------------------------------------------
 validate_all_nodes() {
   log_section "Validating Node Join"
@@ -63,13 +63,15 @@ validate_all_nodes() {
     --overwrite-existing \
     --admin
 
-  local msi_vm_name token_vm_name
+  local msi_vm_name token_vm_name kubeadm_vm_name
   msi_vm_name="$(state_get msi_vm_name)"
   token_vm_name="$(state_get token_vm_name)"
+  kubeadm_vm_name="$(state_get kubeadm_vm_name)"
 
   local failed=0
   validate_node_joined "${msi_vm_name}" || failed=1
   validate_node_joined "${token_vm_name}" || failed=1
+  validate_node_joined "${kubeadm_vm_name}" || failed=1
 
   if [[ "${failed}" -eq 1 ]]; then
     log_error "One or more nodes failed to join"
@@ -79,7 +81,7 @@ validate_all_nodes() {
   echo ""
   log_info "All cluster nodes:"
   kubectl get nodes -o wide
-  log_success "Both nodes verified in cluster"
+  log_success "All nodes verified in cluster"
 }
 
 # ---------------------------------------------------------------------------
@@ -133,18 +135,20 @@ EOF
 }
 
 # ---------------------------------------------------------------------------
-# smoke_test_all - Run smoke tests on both nodes
+# smoke_test_all - Run smoke tests on all nodes
 # ---------------------------------------------------------------------------
 smoke_test_all() {
   log_section "Running Smoke Tests"
 
-  local msi_vm_name token_vm_name
+  local msi_vm_name token_vm_name kubeadm_vm_name
   msi_vm_name="$(state_get msi_vm_name)"
   token_vm_name="$(state_get token_vm_name)"
+  kubeadm_vm_name="$(state_get kubeadm_vm_name)"
 
   local failed=0
   smoke_test "${msi_vm_name}" "msi" || failed=1
   smoke_test "${token_vm_name}" "token" || failed=1
+  smoke_test "${kubeadm_vm_name}" "kubeadm" || failed=1
 
   if [[ "${failed}" -eq 1 ]]; then
     log_error "One or more smoke tests failed"
diff --git a/hack/e2e/run.sh b/hack/e2e/run.sh
index 9471472..12a0d52 100755
--- a/hack/e2e/run.sh
+++ b/hack/e2e/run.sh
@@ -6,16 +6,17 @@
 #   ./hack/e2e/run.sh [command] [options]
 #
 # Commands:
-#   all        Run the full E2E flow (default): build, infra, join, validate, cleanup
-#   infra      Deploy infrastructure only (Bicep: AKS + 2 VMs)
-#   join       Join both nodes to the cluster (requires prior infra)
-#   join-msi   Join only the MSI node
-#   join-token Join only the token node
-#   validate   Verify nodes joined + run smoke tests
-#   smoke      Run smoke tests only (pods on flex nodes)
-#   logs       Collect logs from VMs
-#   cleanup    Tear down Azure resources
-#   status     Show current state (deployment outputs)
+#   all           Run the full E2E flow (default): build, infra, join, validate, cleanup
+#   infra         Deploy infrastructure only (Bicep: AKS + 3 VMs)
+#   join          Join all nodes to the cluster (requires prior infra)
+#   join-msi      Join only the MSI node
+#   join-token    Join only the token node
+#   join-kubeadm  Join only the kubeadm node (apply -f with KubeadmNodeJoin)
+#   validate      Verify nodes joined + run smoke tests
+#   smoke         Run smoke tests only (pods on flex nodes)
+#   logs          Collect logs from VMs
+#   cleanup       Tear down Azure resources
+#   status        Show current state (deployment outputs)
 #
 # Options:
 #   -g, --resource-group  Azure resource group      (or E2E_RESOURCE_GROUP env)
@@ -56,6 +57,9 @@
 #   ./hack/e2e/run.sh join
 #   ./hack/e2e/run.sh validate
 #
+#   # Test only the kubeadm join flow (apply -f)
+#   ./hack/e2e/run.sh join-kubeadm
+#
 #   # Use a pre-built binary
 #   ./hack/e2e/run.sh --binary ./aks-flex-node all
 #
@@ -101,7 +105,7 @@ usage() {
 parse_args() {
   while [[ $# -gt 0 ]]; do
     case "$1" in
-      all|infra|join|join-msi|join-token|validate|smoke|logs|cleanup|status)
+      all|infra|join|join-msi|join-token|join-kubeadm|validate|smoke|logs|cleanup|status)
         COMMAND="$1"; shift ;;
       -g|--resource-group) export E2E_RESOURCE_GROUP="$2"; shift 2 ;;
       -l|--location)       export E2E_LOCATION="$2"; shift 2 ;;
@@ -213,6 +217,10 @@ main() {
       ensure_binary
       node_join_token
       ;;
+    join-kubeadm)
+      ensure_binary
+      node_join_kubeadm
+      ;;
     validate)
       validate_all_nodes
       smoke_test_all

From 949e7bcad93318fe7b60431116b1cb184deb3c85 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 28 Feb 2026 06:17:09 +0000
Subject: [PATCH 3/6] Address review feedback: Bicep module, kubeadm
 cert-rotation RBAC, direct apply invocation

Co-authored-by: bcho <1975118+bcho@users.noreply.github.com>
---
 hack/e2e/infra/main.bicep       | 281 ++++++--------------------------
 hack/e2e/infra/modules/vm.bicep | 122 ++++++++++++++
 hack/e2e/lib/node-join.sh       |  44 ++---
 3 files changed, 193 insertions(+), 254 deletions(-)
 create mode 100644 hack/e2e/infra/modules/vm.bicep

diff --git a/hack/e2e/infra/main.bicep b/hack/e2e/infra/main.bicep
index 0073957..646906c 100644
--- a/hack/e2e/infra/main.bicep
+++ b/hack/e2e/infra/main.bicep
@@ -5,8 +5,10 @@
 //   - AKS cluster (1-node control plane)
 //   - VM with system-assigned managed identity  (MSI auth mode)
 //   - VM without managed identity               (bootstrap token auth mode)
+//   - VM without managed identity               (bootstrap token auth, kubeadm join via apply -f)
 //
-// Both VMs run Ubuntu 22.04 LTS, have public IPs, and allow SSH ingress.
+// All flex-node VMs run Ubuntu 22.04 LTS, have public IPs, and allow SSH
+// ingress.  VM creation is delegated to the reusable modules/vm.bicep module.
 // =============================================================================
 
 @description('Azure region for all resources.')
@@ -137,233 +139,47 @@ resource aksCluster 'Microsoft.ContainerService/managedClusters@2024-01-01' = {
 }
 
 // ---------------------------------------------------------------------------
-// Public IPs for VMs
+// Flex-node VMs (via reusable module)
 // ---------------------------------------------------------------------------
-resource pipMsi 'Microsoft.Network/publicIPAddresses@2023-11-01' = {
-  name: '${msiVmName}-pip'
-  location: location
-  tags: tags
-  sku: { name: 'Standard' }
-  properties: {
-    publicIPAllocationMethod: 'Static'
-  }
-}
-
-resource pipToken 'Microsoft.Network/publicIPAddresses@2023-11-01' = {
-  name: '${tokenVmName}-pip'
-  location: location
-  tags: tags
-  sku: { name: 'Standard' }
-  properties: {
-    publicIPAllocationMethod: 'Static'
-  }
-}
-
-resource pipKubeadm 'Microsoft.Network/publicIPAddresses@2023-11-01' = {
-  name: '${kubeadmVmName}-pip'
-  location: location
-  tags: tags
-  sku: { name: 'Standard' }
-  properties: {
-    publicIPAllocationMethod: 'Static'
-  }
-}
-
-// ---------------------------------------------------------------------------
-// NICs
-// ---------------------------------------------------------------------------
-resource nicMsi 'Microsoft.Network/networkInterfaces@2023-11-01' = {
-  name: '${msiVmName}-nic'
-  location: location
-  tags: tags
-  properties: {
-    ipConfigurations: [
-      {
-        name: 'ipconfig1'
-        properties: {
-          subnet: {
-            id: vnet.properties.subnets[1].id
-          }
-          publicIPAddress: {
-            id: pipMsi.id
-          }
-          privateIPAllocationMethod: 'Dynamic'
-        }
-      }
-    ]
-  }
-}
-
-resource nicToken 'Microsoft.Network/networkInterfaces@2023-11-01' = {
-  name: '${tokenVmName}-nic'
-  location: location
-  tags: tags
-  properties: {
-    ipConfigurations: [
-      {
-        name: 'ipconfig1'
-        properties: {
-          subnet: {
-            id: vnet.properties.subnets[1].id
-          }
-          publicIPAddress: {
-            id: pipToken.id
-          }
-          privateIPAllocationMethod: 'Dynamic'
-        }
-      }
-    ]
-  }
-}
-
-resource nicKubeadm 'Microsoft.Network/networkInterfaces@2023-11-01' = {
-  name: '${kubeadmVmName}-nic'
-  location: location
-  tags: tags
-  properties: {
-    ipConfigurations: [
-      {
-        name: 'ipconfig1'
-        properties: {
-          subnet: {
-            id: vnet.properties.subnets[1].id
-          }
-          publicIPAddress: {
-            id: pipKubeadm.id
-          }
-          privateIPAllocationMethod: 'Dynamic'
-        }
-      }
-    ]
+module vmMsi 'modules/vm.bicep' = {
+  name: 'deploy-vm-msi'
+  params: {
+    location: location
+    vmName: msiVmName
+    vmSize: vmSize
+    adminUsername: adminUsername
+    sshPublicKey: sshPublicKey
+    subnetId: vnet.properties.subnets[1].id
+    assignManagedIdentity: true
+    tags: tags
   }
 }
 
-// ---------------------------------------------------------------------------
-// VM: MSI (system-assigned managed identity)
-// ---------------------------------------------------------------------------
-resource vmMsi 'Microsoft.Compute/virtualMachines@2024-03-01' = {
-  name: msiVmName
-  location: location
-  tags: tags
-  identity: {
-    type: 'SystemAssigned'
-  }
-  properties: {
-    hardwareProfile: { vmSize: vmSize }
-    osProfile: {
-      computerName: msiVmName
-      adminUsername: adminUsername
-      linuxConfiguration: {
-        disablePasswordAuthentication: true
-        ssh: {
-          publicKeys: [
-            {
-              path: '/home/${adminUsername}/.ssh/authorized_keys'
-              keyData: sshPublicKey
-            }
-          ]
-        }
-      }
-    }
-    storageProfile: {
-      imageReference: {
-        publisher: 'Canonical'
-        offer: '0001-com-ubuntu-server-jammy'
-        sku: '22_04-lts-gen2'
-        version: 'latest'
-      }
-      osDisk: {
-        createOption: 'FromImage'
-        managedDisk: { storageAccountType: 'StandardSSD_LRS' }
-      }
-    }
-    networkProfile: {
-      networkInterfaces: [ { id: nicMsi.id } ]
-    }
+module vmToken 'modules/vm.bicep' = {
+  name: 'deploy-vm-token'
+  params: {
+    location: location
+    vmName: tokenVmName
+    vmSize: vmSize
+    adminUsername: adminUsername
+    sshPublicKey: sshPublicKey
+    subnetId: vnet.properties.subnets[1].id
+    assignManagedIdentity: false
+    tags: tags
   }
 }
 
-// ---------------------------------------------------------------------------
-// VM: Token (no managed identity)
-// ---------------------------------------------------------------------------
-resource vmToken 'Microsoft.Compute/virtualMachines@2024-03-01' = {
-  name: tokenVmName
-  location: location
-  tags: tags
-  properties: {
-    hardwareProfile: { vmSize: vmSize }
-    osProfile: {
-      computerName: tokenVmName
-      adminUsername: adminUsername
-      linuxConfiguration: {
-        disablePasswordAuthentication: true
-        ssh: {
-          publicKeys: [
-            {
-              path: '/home/${adminUsername}/.ssh/authorized_keys'
-              keyData: sshPublicKey
-            }
-          ]
-        }
-      }
-    }
-    storageProfile: {
-      imageReference: {
-        publisher: 'Canonical'
-        offer: '0001-com-ubuntu-server-jammy'
-        sku: '22_04-lts-gen2'
-        version: 'latest'
-      }
-      osDisk: {
-        createOption: 'FromImage'
-        managedDisk: { storageAccountType: 'StandardSSD_LRS' }
-      }
-    }
-    networkProfile: {
-      networkInterfaces: [ { id: nicToken.id } ]
-    }
-  }
-}
-
-// ---------------------------------------------------------------------------
-// VM: Kubeadm (no managed identity - uses apply -f with kubeadm join flow)
-// ---------------------------------------------------------------------------
-resource vmKubeadm 'Microsoft.Compute/virtualMachines@2024-03-01' = {
-  name: kubeadmVmName
-  location: location
-  tags: tags
-  properties: {
-    hardwareProfile: { vmSize: vmSize }
-    osProfile: {
-      computerName: kubeadmVmName
-      adminUsername: adminUsername
-      linuxConfiguration: {
-        disablePasswordAuthentication: true
-        ssh: {
-          publicKeys: [
-            {
-              path: '/home/${adminUsername}/.ssh/authorized_keys'
-              keyData: sshPublicKey
-            }
-          ]
-        }
-      }
-    }
-    storageProfile: {
-      imageReference: {
-        publisher: 'Canonical'
-        offer: '0001-com-ubuntu-server-jammy'
-        sku: '22_04-lts-gen2'
-        version: 'latest'
-      }
-      osDisk: {
-        createOption: 'FromImage'
-        managedDisk: { storageAccountType: 'StandardSSD_LRS' }
-      }
-    }
-    networkProfile: {
-      networkInterfaces: [ { id: nicKubeadm.id } ]
-    }
+module vmKubeadm 'modules/vm.bicep' = {
+  name: 'deploy-vm-kubeadm'
+  params: {
+    location: location
+    vmName: kubeadmVmName
+    vmSize: vmSize
+    adminUsername: adminUsername
+    sshPublicKey: sshPublicKey
+    subnetId: vnet.properties.subnets[1].id
+    assignManagedIdentity: false
+    tags: tags
   }
 }
 
@@ -372,10 +188,10 @@ resource vmKubeadm 'Microsoft.Compute/virtualMachines@2024-03-01' = {
 // ---------------------------------------------------------------------------
 // Azure Kubernetes Service Cluster Admin Role
 resource roleClusterAdmin 'Microsoft.Authorization/roleAssignments@2022-04-01' = {
-  name: guid(aksCluster.id, vmMsi.id, 'aks-cluster-admin')
+  name: guid(aksCluster.id, vmMsi.outputs.principalId, 'aks-cluster-admin')
   scope: aksCluster
   properties: {
-    principalId: vmMsi.identity.principalId
+    principalId: vmMsi.outputs.principalId
     principalType: 'ServicePrincipal'
     roleDefinitionId: subscriptionResourceId('Microsoft.Authorization/roleDefinitions', '0ab0b1a8-8aac-4efd-b8c2-3ee1fb270be8')
   }
@@ -383,10 +199,10 @@ resource roleClusterAdmin 'Microsoft.Authorization/roleAssignments@2022-04-01' =
 
 // Azure Kubernetes Service RBAC Cluster Admin
 resource roleRbacAdmin 'Microsoft.Authorization/roleAssignments@2022-04-01' = {
-  name: guid(aksCluster.id, vmMsi.id, 'aks-rbac-cluster-admin')
+  name: guid(aksCluster.id, vmMsi.outputs.principalId, 'aks-rbac-cluster-admin')
   scope: aksCluster
   properties: {
-    principalId: vmMsi.identity.principalId
+    principalId: vmMsi.outputs.principalId
     principalType: 'ServicePrincipal'
     roleDefinitionId: subscriptionResourceId('Microsoft.Authorization/roleDefinitions', 'b1ff04bb-8a4e-4dc4-8eb5-8693973ce19b')
   }
@@ -399,14 +215,15 @@ output clusterName string = aksCluster.name
 output clusterId string = aksCluster.id
 output clusterFqdn string = aksCluster.properties.fqdn
 
-output msiVmName string = vmMsi.name
-output msiVmIp string = pipMsi.properties.ipAddress
-output msiVmPrincipalId string = vmMsi.identity.principalId
+output msiVmName string = vmMsi.outputs.vmName
+output msiVmIp string = vmMsi.outputs.publicIpAddress
+output msiVmPrincipalId string = vmMsi.outputs.principalId
 
-output tokenVmName string = vmToken.name
-output tokenVmIp string = pipToken.properties.ipAddress
+output tokenVmName string = vmToken.outputs.vmName
+output tokenVmIp string = vmToken.outputs.publicIpAddress
 
-output kubeadmVmName string = vmKubeadm.name
-output kubeadmVmIp string = pipKubeadm.properties.ipAddress
+output kubeadmVmName string = vmKubeadm.outputs.vmName
+output kubeadmVmIp string = vmKubeadm.outputs.publicIpAddress
 
 output adminUsername string = adminUsername
+
diff --git a/hack/e2e/infra/modules/vm.bicep b/hack/e2e/infra/modules/vm.bicep
new file mode 100644
index 0000000..70fdbd6
--- /dev/null
+++ b/hack/e2e/infra/modules/vm.bicep
@@ -0,0 +1,122 @@
+// =============================================================================
+// modules/vm.bicep - Reusable Ubuntu flex-node VM module
+//
+// Creates a public IP, NIC, and Ubuntu 22.04 VM in the given subnet.
+// =============================================================================
+
+@description('Azure region for all resources.')
+param location string
+
+@description('VM name (also used as prefix for NIC and public IP names).')
+param vmName string
+
+@description('VM size.')
+param vmSize string
+
+@description('Admin username.')
+param adminUsername string
+
+@description('SSH public key.')
+@secure()
+param sshPublicKey string
+
+@description('Subnet resource ID to attach the NIC to.')
+param subnetId string
+
+@description('Whether to assign a system-assigned managed identity to the VM.')
+param assignManagedIdentity bool = false
+
+@description('Tags applied to all resources in this module.')
+param tags object = {}
+
+// ---------------------------------------------------------------------------
+// Public IP
+// ---------------------------------------------------------------------------
+resource pip 'Microsoft.Network/publicIPAddresses@2023-11-01' = {
+  name: '${vmName}-pip'
+  location: location
+  tags: tags
+  sku: { name: 'Standard' }
+  properties: {
+    publicIPAllocationMethod: 'Static'
+  }
+}
+
+// ---------------------------------------------------------------------------
+// NIC
+// ---------------------------------------------------------------------------
+resource nic 'Microsoft.Network/networkInterfaces@2023-11-01' = {
+  name: '${vmName}-nic'
+  location: location
+  tags: tags
+  properties: {
+    ipConfigurations: [
+      {
+        name: 'ipconfig1'
+        properties: {
+          subnet: {
+            id: subnetId
+          }
+          publicIPAddress: {
+            id: pip.id
+          }
+          privateIPAllocationMethod: 'Dynamic'
+        }
+      }
+    ]
+  }
+}
+
+// ---------------------------------------------------------------------------
+// VM
+// ---------------------------------------------------------------------------
+resource vm 'Microsoft.Compute/virtualMachines@2024-03-01' = {
+  name: vmName
+  location: location
+  tags: tags
+  identity: assignManagedIdentity ? {
+    type: 'SystemAssigned'
+  } : {
+    type: 'None'
+  }
+  properties: {
+    hardwareProfile: { vmSize: vmSize }
+    osProfile: {
+      computerName: vmName
+      adminUsername: adminUsername
+      linuxConfiguration: {
+        disablePasswordAuthentication: true
+        ssh: {
+          publicKeys: [
+            {
+              path: '/home/${adminUsername}/.ssh/authorized_keys'
+              keyData: sshPublicKey
+            }
+          ]
+        }
+      }
+    }
+    storageProfile: {
+      imageReference: {
+        publisher: 'Canonical'
+        offer: '0001-com-ubuntu-server-jammy'
+        sku: '22_04-lts-gen2'
+        version: 'latest'
+      }
+      osDisk: {
+        createOption: 'FromImage'
+        managedDisk: { storageAccountType: 'StandardSSD_LRS' }
+      }
+    }
+    networkProfile: {
+      networkInterfaces: [ { id: nic.id } ]
+    }
+  }
+}
+
+// ---------------------------------------------------------------------------
+// Outputs
+// ---------------------------------------------------------------------------
+output vmName string = vm.name
+output publicIpAddress string = pip.properties.ipAddress
+output principalId string = assignManagedIdentity ? vm.identity.principalId : ''
diff --git a/hack/e2e/lib/node-join.sh b/hack/e2e/lib/node-join.sh
index 3b1eb06..8da2d51 100755
--- a/hack/e2e/lib/node-join.sh
+++ b/hack/e2e/lib/node-join.sh
@@ -362,7 +362,11 @@ stringData:
   auth-extra-groups: "system:bootstrappers:aks-flex-node"
 EOF
 
-  # Create RBAC bindings for TLS bootstrapping (idempotent)
+  # Create RBAC bindings for TLS bootstrapping (idempotent).
+  # These three bindings mirror what kubeadm init normally sets up:
+  #  1. system:node-bootstrapper          – allows nodes to create CSRs
+  #  2. nodeclient auto-approval          – auto-approves initial node certs
+  #  3. selfnodeclient auto-approval      – auto-approves certificate rotations
   kubectl apply -f - <<EOF
 apiVersion: rbac.authorization.k8s.io/v1
 kind: ClusterRoleBinding
@@ -402,6 +406,19 @@ subjects:
 - apiGroup: rbac.authorization.k8s.io
   kind: Group
   name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-auto-approve-certificate-rotation
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:certificates.k8s.io:certificatesigningrequests:selfnodeclient
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:nodes
 EOF
 
   log_success "Bootstrap token and RBAC configured"
@@ -479,14 +496,12 @@ EOF
 ]
 EOF
 
-  # Step 3: Upload binary and action file, then run apply -f via systemd
-  local unit_name="aks-flex-node-kubeadm"
-
+  # Step 3: Upload binary and action file, then run apply -f directly
   log_info "Uploading binary and action file to ${vm_ip}..."
   remote_copy "${E2E_BINARY}" "${vm_ip}" "/tmp/aks-flex-node-binary"
   remote_copy "${action_file}" "${vm_ip}" "/tmp/kubeadm-join.json"
 
-  log_info "Starting kubeadm join via apply -f on ${vm_ip}..."
+  log_info "Running kubeadm join via apply -f on ${vm_ip}..."
   remote_exec "${vm_ip}" 'bash -s' <<REMOTE
 set -euo pipefail
 
@@ -497,24 +512,9 @@ aks-flex-node version
 sudo mkdir -p /etc/aks-flex-node /var/log/aks-flex-node
 sudo cp /tmp/kubeadm-join.json /etc/aks-flex-node/
 
-sudo systemd-run \
-  --unit=${unit_name} \
-  --description="AKS Flex Node E2E kubeadm join (${unit_name})" \
-  --remain-after-exit \
-  /usr/local/bin/aks-flex-node apply --no-prettyui -f /etc/aks-flex-node/kubeadm-join.json
-
-echo "Waiting ${E2E_BOOTSTRAP_SETTLE_TIME}s for bootstrap to complete..."
-sleep ${E2E_BOOTSTRAP_SETTLE_TIME}
-
-if systemctl is-active --quiet ${unit_name}; then
-  echo "Apply service is running"
-else
-  echo "Apply service failed:"
-  sudo journalctl -u ${unit_name} -n 50 --no-pager || true
-  exit 1
-fi
+sudo /usr/local/bin/aks-flex-node apply --no-prettyui -f /etc/aks-flex-node/kubeadm-join.json \
+  2>&1 | sudo tee /var/log/aks-flex-node/aks-flex-node.log
 
-sleep 10
 if systemctl is-active --quiet kubelet; then
   echo "kubelet is running"
 else

From 836de59465b4edd2e41d83858d6b0e03216f1667 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 28 Feb 2026 06:23:42 +0000
Subject: [PATCH 4/6] Add full kubeadm bootstrap config and VHD
 parameterization in vm.bicep module

Co-authored-by: bcho <1975118+bcho@users.noreply.github.com>
---
 hack/e2e/infra/modules/vm.bicep |  23 ++++--
 hack/e2e/lib/node-join.sh       | 140 ++++++++++++++++++++++++++++++--
 2 files changed, 149 insertions(+), 14 deletions(-)

diff --git a/hack/e2e/infra/modules/vm.bicep b/hack/e2e/infra/modules/vm.bicep
index 70fdbd6..b1b9e56 100644
--- a/hack/e2e/infra/modules/vm.bicep
+++ b/hack/e2e/infra/modules/vm.bicep
@@ -1,7 +1,8 @@
 // =============================================================================
 // modules/vm.bicep - Reusable Ubuntu flex-node VM module
 //
-// Creates a public IP, NIC, and Ubuntu 22.04 VM in the given subnet.
+// Creates a public IP, NIC, and Ubuntu VM in the given subnet.
+// The Marketplace image defaults to Ubuntu 24.04 LTS (Noble) but can be overridden.
 // =============================================================================
 
 @description('Azure region for all resources.')
@@ -26,6 +27,18 @@ param subnetId string
 @description('Whether to assign a system-assigned managed identity to the VM.')
 param assignManagedIdentity bool = false
 
+@description('Marketplace image publisher.')
+param imagePublisher string = 'Canonical'
+
+@description('Marketplace image offer.')
+param imageOffer string = 'ubuntu-24_04-lts'
+
+@description('Marketplace image SKU.')
+param imageSku string = 'server'
+
+@description('Marketplace image version.')
+param imageVersion string = 'latest'
+
 @description('Tags applied to all resources in this module.')
 param tags object = {}
 
@@ -98,10 +111,10 @@ resource vm 'Microsoft.Compute/virtualMachines@2024-03-01' = {
     }
     storageProfile: {
       imageReference: {
-        publisher: 'Canonical'
-        offer: '0001-com-ubuntu-server-jammy'
-        sku: '22_04-lts-gen2'
-        version: 'latest'
+        publisher: imagePublisher
+        offer: imageOffer
+        sku: imageSku
+        version: imageVersion
       }
       osDisk: {
         createOption: 'FromImage'
diff --git a/hack/e2e/lib/node-join.sh b/hack/e2e/lib/node-join.sh
index 8da2d51..5b61aa1 100755
--- a/hack/e2e/lib/node-join.sh
+++ b/hack/e2e/lib/node-join.sh
@@ -363,10 +363,13 @@ stringData:
 EOF
 
   # Create RBAC bindings for TLS bootstrapping (idempotent).
-  # These three bindings mirror what kubeadm init normally sets up:
-  #  1. system:node-bootstrapper          – allows nodes to create CSRs
-  #  2. nodeclient auto-approval          – auto-approves initial node certs
-  #  3. selfnodeclient auto-approval      – auto-approves certificate rotations
+  # Mirrors the full set of resources that kubeadm init sets up:
+  #  - ClusterRoleBindings for CSR creation and auto-approval
+  #  - Roles/RoleBindings granting bootstrappers read access to kubeadm config
+  #    and kubelet config (required by kubeadm join's preflight phase)
+  #  - ClusterRole/ClusterRoleBinding for bootstrappers to GET nodes
+  #  - ConfigMaps: cluster-info (kube-public), kubeadm-config and
+  #    kubelet-config (kube-system) consumed by kubeadm join
   kubectl apply -f - <<EOF
 apiVersion: rbac.authorization.k8s.io/v1
 kind: ClusterRoleBinding
@@ -396,6 +399,19 @@ subjects:
 ---
 apiVersion: rbac.authorization.k8s.io/v1
 kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-auto-approve-certificate-rotation
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:certificates.k8s.io:certificatesigningrequests:selfnodeclient
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:nodes
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
 metadata:
   name: aks-flex-node-role
 roleRef:
@@ -408,17 +424,123 @@ subjects:
   name: system:bootstrappers:aks-flex-node
 ---
 apiVersion: rbac.authorization.k8s.io/v1
+kind: Role
+metadata:
+  namespace: kube-system
+  name: kubeadm:nodes-kubeadm-config
+rules:
+- verbs: ["get"]
+  apiGroups: [""]
+  resources: ["configmaps"]
+  resourceNames: ["kubeadm-config"]
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: RoleBinding
+metadata:
+  namespace: kube-system
+  name: kubeadm:nodes-kubeadm-config
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: Role
+  name: kubeadm:nodes-kubeadm-config
+subjects:
+- kind: Group
+  apiGroup: rbac.authorization.k8s.io
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: Role
+metadata:
+  namespace: kube-system
+  name: kubeadm:kubelet-config
+rules:
+- verbs: ["get"]
+  apiGroups: [""]
+  resources: ["configmaps"]
+  resourceNames: ["kubelet-config"]
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: RoleBinding
+metadata:
+  namespace: kube-system
+  name: kubeadm:kubelet-config
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: Role
+  name: kubeadm:kubelet-config
+subjects:
+- kind: Group
+  apiGroup: rbac.authorization.k8s.io
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRole
+metadata:
+  name: kubeadm:get-nodes
+rules:
+- verbs: ["get"]
+  apiGroups: [""]
+  resources: ["nodes"]
+---
+apiVersion: rbac.authorization.k8s.io/v1
 kind: ClusterRoleBinding
 metadata:
-  name: aks-flex-node-auto-approve-certificate-rotation
+  name: kubeadm:get-nodes
 roleRef:
   apiGroup: rbac.authorization.k8s.io
   kind: ClusterRole
-  name: system:certificates.k8s.io:certificatesigningrequests:selfnodeclient
+  name: kubeadm:get-nodes
 subjects:
-- apiGroup: rbac.authorization.k8s.io
-  kind: Group
-  name: system:nodes
+- kind: Group
+  apiGroup: rbac.authorization.k8s.io
+  name: system:bootstrappers:aks-flex-node
+EOF
+
+  # Publish the ConfigMaps that kubeadm join reads during its preflight phase.
+  # cluster-info goes into kube-public (publicly readable).
+  # kubeadm-config and kubelet-config go into kube-system (bootstrapper-readable).
+  kubectl apply -f - <<EOF
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  namespace: kube-public
+  name: cluster-info
+data:
+  kubeconfig: |
+    apiVersion: v1
+    kind: Config
+    clusters:
+    - cluster:
+        certificate-authority-data: ${ca_cert_data}
+        server: ${server_url}
+      name: ""
+    contexts: []
+    current-context: ""
+    preferences: {}
+    users: []
+---
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  namespace: kube-system
+  name: kubeadm-config
+data:
+  ClusterConfiguration: |
+    apiVersion: kubeadm.k8s.io/v1beta4
+    kind: ClusterConfiguration
+    kubernetesVersion: ${E2E_KUBERNETES_VERSION}
+    networking:
+      serviceSubnet: 10.0.0.0/16
+---
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  namespace: kube-system
+  name: kubelet-config
+data:
+  kubelet: |
+    apiVersion: kubelet.config.k8s.io/v1beta1
+    kind: KubeletConfiguration
 EOF
 
   log_success "Bootstrap token and RBAC configured"

From 9c59f4c54e1bff4ebca2691d6a8711285a2e8047 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 28 Feb 2026 06:39:21 +0000
Subject: [PATCH 5/6] Fix BCP120: use msiVmName var instead of module output in
 roleAssignment names

Co-authored-by: bcho <1975118+bcho@users.noreply.github.com>
---
 hack/e2e/infra/main.bicep | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/hack/e2e/infra/main.bicep b/hack/e2e/infra/main.bicep
index 646906c..491c7d7 100644
--- a/hack/e2e/infra/main.bicep
+++ b/hack/e2e/infra/main.bicep
@@ -188,7 +188,7 @@ module vmKubeadm 'modules/vm.bicep' = {
 // ---------------------------------------------------------------------------
 // Azure Kubernetes Service Cluster Admin Role
 resource roleClusterAdmin 'Microsoft.Authorization/roleAssignments@2022-04-01' = {
-  name: guid(aksCluster.id, vmMsi.outputs.principalId, 'aks-cluster-admin')
+  name: guid(aksCluster.id, msiVmName, 'aks-cluster-admin')
   scope: aksCluster
   properties: {
     principalId: vmMsi.outputs.principalId
@@ -199,7 +199,7 @@ resource roleClusterAdmin 'Microsoft.Authorization/roleAssignments@2022-04-01' =
 
 // Azure Kubernetes Service RBAC Cluster Admin
 resource roleRbacAdmin 'Microsoft.Authorization/roleAssignments@2022-04-01' = {
-  name: guid(aksCluster.id, vmMsi.outputs.principalId, 'aks-rbac-cluster-admin')
+  name: guid(aksCluster.id, msiVmName, 'aks-rbac-cluster-admin')
   scope: aksCluster
   properties: {
     principalId: vmMsi.outputs.principalId

From eba1003157b866d0b186149d606060b9cbceeb2d Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Sat, 28 Feb 2026 06:59:09 +0000
Subject: [PATCH 6/6] Split node-join.sh into node-join-msi.sh,
 node-join-token.sh, node-join-kubeadm.sh

Co-authored-by: bcho <1975118+bcho@users.noreply.github.com>
---
 hack/e2e/README.md                |  13 +-
 hack/e2e/lib/node-join-kubeadm.sh | 353 ++++++++++++++++++
 hack/e2e/lib/node-join-msi.sh     | 104 ++++++
 hack/e2e/lib/node-join-token.sh   | 158 ++++++++
 hack/e2e/lib/node-join.sh         | 594 +-----------------------------
 5 files changed, 635 insertions(+), 587 deletions(-)
 create mode 100644 hack/e2e/lib/node-join-kubeadm.sh
 create mode 100644 hack/e2e/lib/node-join-msi.sh
 create mode 100644 hack/e2e/lib/node-join-token.sh

diff --git a/hack/e2e/README.md b/hack/e2e/README.md
index 7582b10..1066529 100644
--- a/hack/e2e/README.md
+++ b/hack/e2e/README.md
@@ -134,11 +134,14 @@ hack/e2e/
   infra/
     main.bicep        Bicep template (AKS + VNet + NSG + 3 VMs + role assignments)
   lib/
-    common.sh         Logging, prereqs, config, state management, SSH helpers
-    infra.sh          Bicep deployment, output extraction, kubeconfig fetch
-    node-join.sh      MSI, token, and kubeadm node join logic
-    validate.sh       Node-ready checks and smoke tests (nginx pods)
-    cleanup.sh        Log collection and Azure resource teardown
+    common.sh             Logging, prereqs, config, state management, SSH helpers
+    infra.sh              Bicep deployment, output extraction, kubeconfig fetch
+    node-join.sh          Shared helper (_deploy_and_start_agent) + node_join_all orchestration
+    node-join-msi.sh      MSI auth node join (node_join_msi)
+    node-join-token.sh    Bootstrap token node join (node_join_token)
+    node-join-kubeadm.sh  kubeadm join via apply -f (node_join_kubeadm)
+    validate.sh           Node-ready checks and smoke tests (nginx pods)
+    cleanup.sh            Log collection and Azure resource teardown
 ```
 
 ## State File
diff --git a/hack/e2e/lib/node-join-kubeadm.sh b/hack/e2e/lib/node-join-kubeadm.sh
new file mode 100644
index 0000000..23eae1e
--- /dev/null
+++ b/hack/e2e/lib/node-join-kubeadm.sh
@@ -0,0 +1,353 @@
+#!/usr/bin/env bash
+# =============================================================================
+# hack/e2e/lib/node-join-kubeadm.sh - Join an AKS flex node using the kubeadm join flow
+#
+# Functions:
+#   node_join_kubeadm  - Create bootstrap token, generate action file,
+#                        run aks-flex-node apply -f (KubeadmNodeJoin)
+# =============================================================================
+set -euo pipefail
+
+[[ -n "${_E2E_NODE_JOIN_KUBEADM_LOADED:-}" ]] && return 0
+readonly _E2E_NODE_JOIN_KUBEADM_LOADED=1
+
+# shellcheck disable=SC1091
+source "$(dirname "${BASH_SOURCE[0]}")/common.sh"
+
+# ---------------------------------------------------------------------------
+# node_join_kubeadm - Join the Kubeadm VM via aks-flex-node apply -f (KubeadmNodeJoin); no args, reads state + E2E_* vars
+# ---------------------------------------------------------------------------
+node_join_kubeadm() {
+  log_section "Joining Kubeadm Node (apply -f)"
+  local start
+  start=$(timer_start)
+
+  local vm_ip
+  vm_ip="$(state_get kubeadm_vm_ip)"
+  local server_url
+  server_url="$(state_get server_url)"
+  local ca_cert_data
+  ca_cert_data="$(state_get ca_cert_data)"
+
+  # Step 1: Create bootstrap token, RBAC and kubeadm ConfigMaps in the cluster
+  log_info "Creating bootstrap token and RBAC resources for kubeadm join..."
+  local token_id token_secret bootstrap_token expiration
+
+  token_id="$(openssl rand -hex 3)"
+  token_secret="$(openssl rand -hex 8)"
+  bootstrap_token="${token_id}.${token_secret}"
+
+  # Token expires 24h from now; probe for GNU date, else fall back to BSD syntax
+  if date --version &>/dev/null; then
+    # GNU date (accepts --version and -d)
+    expiration="$(date -u -d "+24 hours" +"%Y-%m-%dT%H:%M:%SZ")"
+  else
+    # BSD/macOS date (-v adjusts the current time)
+    expiration="$(date -u -v+24H +"%Y-%m-%dT%H:%M:%SZ")"
+  fi
+
+  log_info "Token ID: ${token_id} | Expires: ${expiration}"
+
+  # Create the bootstrap token Secret (bootstrap-token-<token_id> in kube-system)
+  kubectl apply -f - <<EOF
+apiVersion: v1
+kind: Secret
+metadata:
+  name: bootstrap-token-${token_id}
+  namespace: kube-system
+type: bootstrap.kubernetes.io/token
+stringData:
+  description: "AKS Flex Node E2E kubeadm bootstrap token"
+  token-id: "${token_id}"
+  token-secret: "${token_secret}"
+  expiration: "${expiration}"
+  usage-bootstrap-authentication: "true"
+  usage-bootstrap-signing: "true"
+  auth-extra-groups: "system:bootstrappers:aks-flex-node"
+EOF
+
+  # Create RBAC objects for TLS bootstrapping (kubectl apply, so re-runs are safe).
+  # Mirrors the RBAC resources that kubeadm init sets up; this manifest contains:
+  #  - ClusterRoleBindings for CSR creation and auto-approval
+  #  - ClusterRoleBinding of the bootstrapper group to system:node
+  #  - Roles/RoleBindings granting bootstrappers read access to the
+  #    kubeadm-config and kubelet-config ConfigMaps in kube-system
+  #  - ClusterRole/ClusterRoleBinding for bootstrappers to GET nodes
+  # The ConfigMaps themselves are published by the next kubectl apply below.
+  kubectl apply -f - <<EOF
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-bootstrapper
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:node-bootstrapper
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-auto-approve-csr
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:certificates.k8s.io:certificatesigningrequests:nodeclient
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-auto-approve-certificate-rotation
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:certificates.k8s.io:certificatesigningrequests:selfnodeclient
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:nodes
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-role
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:node
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: Role
+metadata:
+  namespace: kube-system
+  name: kubeadm:nodes-kubeadm-config
+rules:
+- verbs: ["get"]
+  apiGroups: [""]
+  resources: ["configmaps"]
+  resourceNames: ["kubeadm-config"]
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: RoleBinding
+metadata:
+  namespace: kube-system
+  name: kubeadm:nodes-kubeadm-config
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: Role
+  name: kubeadm:nodes-kubeadm-config
+subjects:
+- kind: Group
+  apiGroup: rbac.authorization.k8s.io
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: Role
+metadata:
+  namespace: kube-system
+  name: kubeadm:kubelet-config
+rules:
+- verbs: ["get"]
+  apiGroups: [""]
+  resources: ["configmaps"]
+  resourceNames: ["kubelet-config"]
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: RoleBinding
+metadata:
+  namespace: kube-system
+  name: kubeadm:kubelet-config
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: Role
+  name: kubeadm:kubelet-config
+subjects:
+- kind: Group
+  apiGroup: rbac.authorization.k8s.io
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRole
+metadata:
+  name: kubeadm:get-nodes
+rules:
+- verbs: ["get"]
+  apiGroups: [""]
+  resources: ["nodes"]
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: kubeadm:get-nodes
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: kubeadm:get-nodes
+subjects:
+- kind: Group
+  apiGroup: rbac.authorization.k8s.io
+  name: system:bootstrappers:aks-flex-node
+EOF
+
+  # Publish the ConfigMaps that kubeadm join reads during its preflight phase.
+  # cluster-info goes into kube-public; it embeds the CA data and API server URL.
+  # kubeadm-config and kubelet-config go into kube-system (readable via the Roles above).
+  kubectl apply -f - <<EOF
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  namespace: kube-public
+  name: cluster-info
+data:
+  kubeconfig: |
+    apiVersion: v1
+    kind: Config
+    clusters:
+    - cluster:
+        certificate-authority-data: ${ca_cert_data}
+        server: ${server_url}
+      name: ""
+    contexts: []
+    current-context: ""
+    preferences: {}
+    users: []
+---
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  namespace: kube-system
+  name: kubeadm-config
+data:
+  ClusterConfiguration: |
+    apiVersion: kubeadm.k8s.io/v1beta4
+    kind: ClusterConfiguration
+    kubernetesVersion: ${E2E_KUBERNETES_VERSION}
+    networking:
+      serviceSubnet: 10.0.0.0/16
+---
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  namespace: kube-system
+  name: kubelet-config
+data:
+  kubelet: |
+    apiVersion: kubelet.config.k8s.io/v1beta1
+    kind: KubeletConfiguration
+EOF
+
+  log_success "Bootstrap token and RBAC configured"
+  state_set "kubeadm_bootstrap_token" "${bootstrap_token}"
+
+  # Step 2: Generate the apply -f action file (JSON array of all bootstrap steps
+  #         ending with the KubeadmNodeJoin action, which carries the token)
+  local action_file="${E2E_WORK_DIR}/kubeadm-join.json"
+  cat > "${action_file}" <<EOF
+[
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.linux.ConfigureBaseOS",
+      "name": "configure-os"
+    },
+    "spec": {}
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.cri.DownloadCRIBinaries",
+      "name": "download-cri-binaries"
+    },
+    "spec": {
+      "containerdVersion": "${E2E_CONTAINERD_VERSION}",
+      "runcVersion": "${E2E_RUNC_VERSION}"
+    }
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.kubebins.DownloadKubeBinaries",
+      "name": "download-kube-binaries"
+    },
+    "spec": {
+      "kubernetesVersion": "${E2E_KUBERNETES_VERSION}"
+    }
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.cni.DownloadCNIBinaries",
+      "name": "download-cni-binaries"
+    },
+    "spec": {}
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.cni.ConfigureCNI",
+      "name": "configure-cni"
+    },
+    "spec": {}
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.cri.StartContainerdService",
+      "name": "start-containerd"
+    },
+    "spec": {}
+  },
+  {
+    "metadata": {
+      "type": "type.googleapis.com/aks.flex.components.kubeadm.KubeadmNodeJoin",
+      "name": "kubeadm-node-join"
+    },
+    "spec": {
+      "controlPlane": {
+        "server": "${server_url}",
+        "certificateAuthorityData": "${ca_cert_data}"
+      },
+      "kubelet": {
+        "bootstrapAuthInfo": {
+          "token": "${bootstrap_token}"
+        }
+      }
+    }
+  }
+]
+EOF
+
+  # Step 3: Upload binary and action file, then run apply -f in the foreground via remote_exec
+  log_info "Uploading binary and action file to ${vm_ip}..."
+  remote_copy "${E2E_BINARY}" "${vm_ip}" "/tmp/aks-flex-node-binary"
+  remote_copy "${action_file}" "${vm_ip}" "/tmp/kubeadm-join.json"
+
+  log_info "Running kubeadm join via apply -f on ${vm_ip}..."
+  remote_exec "${vm_ip}" 'bash -s' <<REMOTE
+set -euo pipefail
+
+sudo cp /tmp/aks-flex-node-binary /usr/local/bin/aks-flex-node
+sudo chmod +x /usr/local/bin/aks-flex-node
+aks-flex-node version
+
+sudo mkdir -p /etc/aks-flex-node /var/log/aks-flex-node
+sudo cp /tmp/kubeadm-join.json /etc/aks-flex-node/
+
+sudo /usr/local/bin/aks-flex-node apply --no-prettyui -f /etc/aks-flex-node/kubeadm-join.json \
+  2>&1 | sudo tee /var/log/aks-flex-node/aks-flex-node.log
+
+if systemctl is-active --quiet kubelet; then
+  echo "kubelet is running"
+else
+  echo "kubelet status:"
+  systemctl status kubelet --no-pager -l 2>&1 || true
+fi
+REMOTE
+
+  log_success "Kubeadm node joined via apply -f in $(timer_elapsed "${start}")s"
+}
diff --git a/hack/e2e/lib/node-join-msi.sh b/hack/e2e/lib/node-join-msi.sh
new file mode 100644
index 0000000..846d42e
--- /dev/null
+++ b/hack/e2e/lib/node-join-msi.sh
@@ -0,0 +1,104 @@
+#!/usr/bin/env bash
+# =============================================================================
+# hack/e2e/lib/node-join-msi.sh - Join an AKS flex node using MSI auth
+#
+# Functions:
+#   node_join_msi  - Install Azure CLI + MSI auth, deploy binary, run agent
+# =============================================================================
+set -euo pipefail
+
+[[ -n "${_E2E_NODE_JOIN_MSI_LOADED:-}" ]] && return 0
+readonly _E2E_NODE_JOIN_MSI_LOADED=1
+
+# shellcheck disable=SC1091
+source "$(dirname "${BASH_SOURCE[0]}")/common.sh"
+
+# ---------------------------------------------------------------------------
+# node_join_msi - Join the MSI VM (state key msi_vm_ip) using managed-identity auth; no args
+# ---------------------------------------------------------------------------
+node_join_msi() {
+  log_section "Joining MSI Node"
+  local start
+  start=$(timer_start)
+
+  local vm_ip
+  vm_ip="$(state_get msi_vm_ip)"
+  local cluster_id
+  cluster_id="$(state_get cluster_id)"
+  local subscription_id
+  subscription_id="$(state_get subscription_id)"
+  local tenant_id
+  tenant_id="$(state_get tenant_id)"
+  local location
+  location="$(state_get location)"
+  local server_url
+  server_url="$(state_get server_url)"
+  local ca_cert_data
+  ca_cert_data="$(state_get ca_cert_data)"
+
+  # Step 1: Install Azure CLI on the VM (up to 5 attempts), then az login --identity as the remote user and via sudo
+  log_info "Installing Azure CLI on MSI VM (${vm_ip})..."
+  remote_exec "${vm_ip}" 'bash -s' <<'AZURECLI'
+set -euo pipefail
+
+MAX_RETRIES=5
+RETRY_DELAY=15
+for attempt in $(seq 1 $MAX_RETRIES); do
+  while sudo fuser /var/lib/dpkg/lock-frontend >/dev/null 2>&1; do
+    sleep 5
+  done
+
+  if sudo apt-get update -qq && curl -sL https://aka.ms/InstallAzureCLIDeb | sudo bash; then
+    echo "Azure CLI installed"
+    break
+  fi
+
+  if [ "$attempt" -lt "$MAX_RETRIES" ]; then
+    sudo dpkg --configure -a 2>/dev/null || true
+    sleep $RETRY_DELAY
+  else
+    echo "Azure CLI installation failed after ${MAX_RETRIES} attempts"
+    exit 1
+  fi
+done
+
+az login --identity --output none
+sudo az login --identity --output none
+echo "Azure CLI authenticated with managed identity"
+AZURECLI
+
+  # Step 2: Generate the agent config for MSI auth under E2E_WORK_DIR
+  local config_file="${E2E_WORK_DIR}/config-msi.json"
+  cat > "${config_file}" <<EOF
+{
+  "azure": {
+    "subscriptionId": "${subscription_id}",
+    "tenantId": "${tenant_id}",
+    "cloud": "AzurePublicCloud",
+    "managedIdentity": {},
+    "targetCluster": {
+      "resourceId": "${cluster_id}",
+      "location": "${location}"
+    }
+  },
+  "node": {
+    "kubelet": {
+      "serverURL": "${server_url}",
+      "caCertData": "${ca_cert_data}"
+    }
+  },
+  "agent": {
+    "logLevel": "debug",
+    "logDir": "/var/log/aks-flex-node"
+  },
+  "kubernetes": { "version": "${E2E_KUBERNETES_VERSION}" },
+  "containerd": { "version": "${E2E_CONTAINERD_VERSION}" },
+  "runc": { "version": "${E2E_RUNC_VERSION}" }
+}
+EOF
+
+  # Step 3: Deploy and start via the shared _deploy_and_start_agent helper (node-join.sh)
+  _deploy_and_start_agent "${vm_ip}" "${config_file}" "aks-flex-node-msi"
+
+  log_success "MSI node joined in $(timer_elapsed "${start}")s"
+}
diff --git a/hack/e2e/lib/node-join-token.sh b/hack/e2e/lib/node-join-token.sh
new file mode 100644
index 0000000..b351d8a
--- /dev/null
+++ b/hack/e2e/lib/node-join-token.sh
@@ -0,0 +1,158 @@
+#!/usr/bin/env bash
+# =============================================================================
+# hack/e2e/lib/node-join-token.sh - Join an AKS flex node using bootstrap token auth
+#
+# Functions:
+#   node_join_token  - Create bootstrap token/RBAC, deploy binary, run agent
+# =============================================================================
+set -euo pipefail
+
+[[ -n "${_E2E_NODE_JOIN_TOKEN_LOADED:-}" ]] && return 0
+readonly _E2E_NODE_JOIN_TOKEN_LOADED=1
+
+# shellcheck disable=SC1091
+source "$(dirname "${BASH_SOURCE[0]}")/common.sh"
+
+# ---------------------------------------------------------------------------
+# node_join_token - Join the Token VM (state key token_vm_ip) using bootstrap-token auth; no args
+# ---------------------------------------------------------------------------
+node_join_token() {
+  log_section "Joining Token Node"
+  local start
+  start=$(timer_start)
+
+  local vm_ip
+  vm_ip="$(state_get token_vm_ip)"
+  local cluster_id
+  cluster_id="$(state_get cluster_id)"
+  local subscription_id
+  subscription_id="$(state_get subscription_id)"
+  local tenant_id
+  tenant_id="$(state_get tenant_id)"
+  local location
+  location="$(state_get location)"
+  local server_url
+  server_url="$(state_get server_url)"
+  local ca_cert_data
+  ca_cert_data="$(state_get ca_cert_data)"
+
+  # Step 1: Create bootstrap token & RBAC in the cluster
+  log_info "Creating bootstrap token and RBAC resources..."
+  local token_id token_secret bootstrap_token expiration
+
+  token_id="$(openssl rand -hex 3)"
+  token_secret="$(openssl rand -hex 8)"
+  bootstrap_token="${token_id}.${token_secret}"
+
+  # Token expires 24h from now; probe for GNU date, else fall back to BSD syntax
+  if date --version &>/dev/null; then
+    # GNU date (accepts --version and -d)
+    expiration="$(date -u -d "+24 hours" +"%Y-%m-%dT%H:%M:%SZ")"
+  else
+    # BSD/macOS date (-v adjusts the current time)
+    expiration="$(date -u -v+24H +"%Y-%m-%dT%H:%M:%SZ")"
+  fi
+
+  log_info "Token ID: ${token_id} | Expires: ${expiration}"
+
+  # Create the bootstrap token Secret (bootstrap-token-<token_id> in kube-system)
+  kubectl apply -f - <<EOF
+apiVersion: v1
+kind: Secret
+metadata:
+  name: bootstrap-token-${token_id}
+  namespace: kube-system
+type: bootstrap.kubernetes.io/token
+stringData:
+  description: "AKS Flex Node E2E bootstrap token"
+  token-id: "${token_id}"
+  token-secret: "${token_secret}"
+  expiration: "${expiration}"
+  usage-bootstrap-authentication: "true"
+  usage-bootstrap-signing: "true"
+  auth-extra-groups: "system:bootstrappers:aks-flex-node"
+EOF
+
+  # Create RBAC bindings for TLS bootstrapping (same names as in node-join-kubeadm.sh)
+  kubectl apply -f - <<EOF
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-bootstrapper
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:node-bootstrapper
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-auto-approve-csr
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:certificates.k8s.io:certificatesigningrequests:nodeclient
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+---
+apiVersion: rbac.authorization.k8s.io/v1
+kind: ClusterRoleBinding
+metadata:
+  name: aks-flex-node-role
+roleRef:
+  apiGroup: rbac.authorization.k8s.io
+  kind: ClusterRole
+  name: system:node
+subjects:
+- apiGroup: rbac.authorization.k8s.io
+  kind: Group
+  name: system:bootstrappers:aks-flex-node
+EOF
+
+  log_success "Bootstrap token and RBAC configured"
+  state_set "bootstrap_token" "${bootstrap_token}"
+
+  # Step 2: Generate the agent config carrying the bootstrap token under E2E_WORK_DIR
+  local config_file="${E2E_WORK_DIR}/config-token.json"
+  cat > "${config_file}" <<EOF
+{
+  "azure": {
+    "subscriptionId": "${subscription_id}",
+    "tenantId": "${tenant_id}",
+    "cloud": "AzurePublicCloud",
+    "bootstrapToken": {
+      "token": "${bootstrap_token}"
+    },
+    "arc": { "enabled": false },
+    "targetCluster": {
+      "resourceId": "${cluster_id}",
+      "location": "${location}"
+    }
+  },
+  "node": {
+    "kubelet": {
+      "serverURL": "${server_url}",
+      "caCertData": "${ca_cert_data}"
+    }
+  },
+  "agent": {
+    "logLevel": "debug",
+    "logDir": "/var/log/aks-flex-node"
+  },
+  "kubernetes": { "version": "${E2E_KUBERNETES_VERSION}" },
+  "containerd": { "version": "${E2E_CONTAINERD_VERSION}" },
+  "runc": { "version": "${E2E_RUNC_VERSION}" }
+}
+EOF
+
+  # Step 3: Deploy and start via the shared _deploy_and_start_agent helper (node-join.sh)
+  _deploy_and_start_agent "${vm_ip}" "${config_file}" "aks-flex-node-token"
+
+  log_success "Token node joined in $(timer_elapsed "${start}")s"
+}
diff --git a/hack/e2e/lib/node-join.sh b/hack/e2e/lib/node-join.sh
index 5b61aa1..92d0c07 100755
--- a/hack/e2e/lib/node-join.sh
+++ b/hack/e2e/lib/node-join.sh
@@ -2,18 +2,13 @@
 # =============================================================================
 # hack/e2e/lib/node-join.sh - Bootstrap flex nodes into the AKS cluster
 #
-# Functions:
-#   node_join_msi      - Install Azure CLI + MSI auth, deploy binary, run agent
-#   node_join_token    - Create bootstrap token/RBAC, deploy binary, run agent
-#   node_join_kubeadm  - Create bootstrap token, deploy binary, run apply -f
-#                        with a KubeadmNodeJoin action (kubeadm join flow)
-#   node_join_all      - Join all nodes (MSI, token, and kubeadm) in parallel
+# Sources:
+#   node-join-msi.sh     - MSI auth node join     (node_join_msi)
+#   node-join-token.sh   - Bootstrap token join   (node_join_token)
+#   node-join-kubeadm.sh - Kubeadm apply -f join  (node_join_kubeadm)
 #
-# Each function:
-#   1. Generates the appropriate config / action file
-#   2. SCPs the binary + config/action file onto the VM
-#   3. Starts the agent via systemd-run
-#   4. Waits for kubelet to report running
+# Functions:
+#   node_join_all  - Join all nodes (MSI, token, and kubeadm) in parallel
 # =============================================================================
 set -euo pipefail
 
@@ -76,577 +71,12 @@ REMOTE
   log_success "Agent started on ${vm_ip}"
 }
 
-# ---------------------------------------------------------------------------
-# node_join_msi - Join the MSI VM
-# ---------------------------------------------------------------------------
-node_join_msi() {
-  log_section "Joining MSI Node"
-  local start
-  start=$(timer_start)
-
-  local vm_ip
-  vm_ip="$(state_get msi_vm_ip)"
-  local cluster_id
-  cluster_id="$(state_get cluster_id)"
-  local subscription_id
-  subscription_id="$(state_get subscription_id)"
-  local tenant_id
-  tenant_id="$(state_get tenant_id)"
-  local location
-  location="$(state_get location)"
-  local server_url
-  server_url="$(state_get server_url)"
-  local ca_cert_data
-  ca_cert_data="$(state_get ca_cert_data)"
-
-  # Step 1: Install Azure CLI on VM and log in with MSI
-  log_info "Installing Azure CLI on MSI VM (${vm_ip})..."
-  remote_exec "${vm_ip}" 'bash -s' <<'AZURECLI'
-set -euo pipefail
-
-MAX_RETRIES=5
-RETRY_DELAY=15
-for attempt in $(seq 1 $MAX_RETRIES); do
-  while sudo fuser /var/lib/dpkg/lock-frontend >/dev/null 2>&1; do
-    sleep 5
-  done
-
-  if sudo apt-get update -qq && curl -sL https://aka.ms/InstallAzureCLIDeb | sudo bash; then
-    echo "Azure CLI installed"
-    break
-  fi
-
-  if [ "$attempt" -lt "$MAX_RETRIES" ]; then
-    sudo dpkg --configure -a 2>/dev/null || true
-    sleep $RETRY_DELAY
-  else
-    echo "Azure CLI installation failed after ${MAX_RETRIES} attempts"
-    exit 1
-  fi
-done
-
-az login --identity --output none
-sudo az login --identity --output none
-echo "Azure CLI authenticated with managed identity"
-AZURECLI
-
-  # Step 2: Generate MSI config
-  local config_file="${E2E_WORK_DIR}/config-msi.json"
-  cat > "${config_file}" <<EOF
-{
-  "azure": {
-    "subscriptionId": "${subscription_id}",
-    "tenantId": "${tenant_id}",
-    "cloud": "AzurePublicCloud",
-    "managedIdentity": {},
-    "targetCluster": {
-      "resourceId": "${cluster_id}",
-      "location": "${location}"
-    }
-  },
-  "node": {
-    "kubelet": {
-      "serverURL": "${server_url}",
-      "caCertData": "${ca_cert_data}"
-    }
-  },
-  "agent": {
-    "logLevel": "debug",
-    "logDir": "/var/log/aks-flex-node"
-  },
-  "kubernetes": { "version": "${E2E_KUBERNETES_VERSION}" },
-  "containerd": { "version": "${E2E_CONTAINERD_VERSION}" },
-  "runc": { "version": "${E2E_RUNC_VERSION}" }
-}
-EOF
-
-  # Step 3: Deploy and start
-  _deploy_and_start_agent "${vm_ip}" "${config_file}" "aks-flex-node-msi"
-
-  log_success "MSI node joined in $(timer_elapsed "${start}")s"
-}
-
-# ---------------------------------------------------------------------------
-# node_join_token - Join the Token VM
-# ---------------------------------------------------------------------------
-node_join_token() {
-  log_section "Joining Token Node"
-  local start
-  start=$(timer_start)
-
-  local vm_ip
-  vm_ip="$(state_get token_vm_ip)"
-  local cluster_id
-  cluster_id="$(state_get cluster_id)"
-  local subscription_id
-  subscription_id="$(state_get subscription_id)"
-  local tenant_id
-  tenant_id="$(state_get tenant_id)"
-  local location
-  location="$(state_get location)"
-  local server_url
-  server_url="$(state_get server_url)"
-  local ca_cert_data
-  ca_cert_data="$(state_get ca_cert_data)"
-
-  # Step 1: Create bootstrap token & RBAC in the cluster
-  log_info "Creating bootstrap token and RBAC resources..."
-  local token_id token_secret bootstrap_token expiration
-
-  token_id="$(openssl rand -hex 3)"
-  token_secret="$(openssl rand -hex 8)"
-  bootstrap_token="${token_id}.${token_secret}"
-
-  # Use a portable date command for expiration (24h from now)
-  if date --version &>/dev/null 2>&1; then
-    # GNU date
-    expiration="$(date -u -d "+24 hours" +"%Y-%m-%dT%H:%M:%SZ")"
-  else
-    # BSD/macOS date
-    expiration="$(date -u -v+24H +"%Y-%m-%dT%H:%M:%SZ")"
-  fi
-
-  log_info "Token ID: ${token_id} | Expires: ${expiration}"
-
-  # Create the bootstrap token secret
-  kubectl apply -f - <<EOF
-apiVersion: v1
-kind: Secret
-metadata:
-  name: bootstrap-token-${token_id}
-  namespace: kube-system
-type: bootstrap.kubernetes.io/token
-stringData:
-  description: "AKS Flex Node E2E bootstrap token"
-  token-id: "${token_id}"
-  token-secret: "${token_secret}"
-  expiration: "${expiration}"
-  usage-bootstrap-authentication: "true"
-  usage-bootstrap-signing: "true"
-  auth-extra-groups: "system:bootstrappers:aks-flex-node"
-EOF
-
-  # Create RBAC bindings for TLS bootstrapping
-  kubectl apply -f - <<EOF
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRoleBinding
-metadata:
-  name: aks-flex-node-bootstrapper
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: ClusterRole
-  name: system:node-bootstrapper
-subjects:
-- apiGroup: rbac.authorization.k8s.io
-  kind: Group
-  name: system:bootstrappers:aks-flex-node
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRoleBinding
-metadata:
-  name: aks-flex-node-auto-approve-csr
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: ClusterRole
-  name: system:certificates.k8s.io:certificatesigningrequests:nodeclient
-subjects:
-- apiGroup: rbac.authorization.k8s.io
-  kind: Group
-  name: system:bootstrappers:aks-flex-node
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRoleBinding
-metadata:
-  name: aks-flex-node-role
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: ClusterRole
-  name: system:node
-subjects:
-- apiGroup: rbac.authorization.k8s.io
-  kind: Group
-  name: system:bootstrappers:aks-flex-node
-EOF
-
-  log_success "Bootstrap token and RBAC configured"
-  state_set "bootstrap_token" "${bootstrap_token}"
-
-  # Step 2: Generate token config
-  local config_file="${E2E_WORK_DIR}/config-token.json"
-  cat > "${config_file}" <<EOF
-{
-  "azure": {
-    "subscriptionId": "${subscription_id}",
-    "tenantId": "${tenant_id}",
-    "cloud": "AzurePublicCloud",
-    "bootstrapToken": {
-      "token": "${bootstrap_token}"
-    },
-    "arc": { "enabled": false },
-    "targetCluster": {
-      "resourceId": "${cluster_id}",
-      "location": "${location}"
-    }
-  },
-  "node": {
-    "kubelet": {
-      "serverURL": "${server_url}",
-      "caCertData": "${ca_cert_data}"
-    }
-  },
-  "agent": {
-    "logLevel": "debug",
-    "logDir": "/var/log/aks-flex-node"
-  },
-  "kubernetes": { "version": "${E2E_KUBERNETES_VERSION}" },
-  "containerd": { "version": "${E2E_CONTAINERD_VERSION}" },
-  "runc": { "version": "${E2E_RUNC_VERSION}" }
-}
-EOF
-
-  # Step 3: Deploy and start
-  _deploy_and_start_agent "${vm_ip}" "${config_file}" "aks-flex-node-token"
-
-  log_success "Token node joined in $(timer_elapsed "${start}")s"
-}
-
-# ---------------------------------------------------------------------------
-# node_join_kubeadm - Join the Kubeadm VM using apply -f with KubeadmNodeJoin
-# ---------------------------------------------------------------------------
-node_join_kubeadm() {
-  log_section "Joining Kubeadm Node (apply -f)"
-  local start
-  start=$(timer_start)
-
-  local vm_ip
-  vm_ip="$(state_get kubeadm_vm_ip)"
-  local server_url
-  server_url="$(state_get server_url)"
-  local ca_cert_data
-  ca_cert_data="$(state_get ca_cert_data)"
-
-  # Step 1: Create bootstrap token & RBAC in the cluster
-  log_info "Creating bootstrap token and RBAC resources for kubeadm join..."
-  local token_id token_secret bootstrap_token expiration
-
-  token_id="$(openssl rand -hex 3)"
-  token_secret="$(openssl rand -hex 8)"
-  bootstrap_token="${token_id}.${token_secret}"
-
-  # Use a portable date command for expiration (24h from now)
-  if date --version &>/dev/null; then
-    # GNU date
-    expiration="$(date -u -d "+24 hours" +"%Y-%m-%dT%H:%M:%SZ")"
-  else
-    # BSD/macOS date
-    expiration="$(date -u -v+24H +"%Y-%m-%dT%H:%M:%SZ")"
-  fi
-
-  log_info "Token ID: ${token_id} | Expires: ${expiration}"
-
-  # Create the bootstrap token secret
-  kubectl apply -f - <<EOF
-apiVersion: v1
-kind: Secret
-metadata:
-  name: bootstrap-token-${token_id}
-  namespace: kube-system
-type: bootstrap.kubernetes.io/token
-stringData:
-  description: "AKS Flex Node E2E kubeadm bootstrap token"
-  token-id: "${token_id}"
-  token-secret: "${token_secret}"
-  expiration: "${expiration}"
-  usage-bootstrap-authentication: "true"
-  usage-bootstrap-signing: "true"
-  auth-extra-groups: "system:bootstrappers:aks-flex-node"
-EOF
-
-  # Create RBAC bindings for TLS bootstrapping (idempotent).
-  # Mirrors the full set of resources that kubeadm init sets up:
-  #  - ClusterRoleBindings for CSR creation and auto-approval
-  #  - Roles/RoleBindings granting bootstrappers read access to kubeadm config
-  #    and kubelet config (required by kubeadm join's preflight phase)
-  #  - ClusterRole/ClusterRoleBinding for bootstrappers to GET nodes
-  #  - ConfigMaps: cluster-info (kube-public), kubeadm-config and
-  #    kubelet-config (kube-system) consumed by kubeadm join
-  kubectl apply -f - <<EOF
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRoleBinding
-metadata:
-  name: aks-flex-node-bootstrapper
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: ClusterRole
-  name: system:node-bootstrapper
-subjects:
-- apiGroup: rbac.authorization.k8s.io
-  kind: Group
-  name: system:bootstrappers:aks-flex-node
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRoleBinding
-metadata:
-  name: aks-flex-node-auto-approve-csr
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: ClusterRole
-  name: system:certificates.k8s.io:certificatesigningrequests:nodeclient
-subjects:
-- apiGroup: rbac.authorization.k8s.io
-  kind: Group
-  name: system:bootstrappers:aks-flex-node
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRoleBinding
-metadata:
-  name: aks-flex-node-auto-approve-certificate-rotation
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: ClusterRole
-  name: system:certificates.k8s.io:certificatesigningrequests:selfnodeclient
-subjects:
-- apiGroup: rbac.authorization.k8s.io
-  kind: Group
-  name: system:nodes
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRoleBinding
-metadata:
-  name: aks-flex-node-role
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: ClusterRole
-  name: system:node
-subjects:
-- apiGroup: rbac.authorization.k8s.io
-  kind: Group
-  name: system:bootstrappers:aks-flex-node
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: Role
-metadata:
-  namespace: kube-system
-  name: kubeadm:nodes-kubeadm-config
-rules:
-- verbs: ["get"]
-  apiGroups: [""]
-  resources: ["configmaps"]
-  resourceNames: ["kubeadm-config"]
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: RoleBinding
-metadata:
-  namespace: kube-system
-  name: kubeadm:nodes-kubeadm-config
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: Role
-  name: kubeadm:nodes-kubeadm-config
-subjects:
-- kind: Group
-  apiGroup: rbac.authorization.k8s.io
-  name: system:bootstrappers:aks-flex-node
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: Role
-metadata:
-  namespace: kube-system
-  name: kubeadm:kubelet-config
-rules:
-- verbs: ["get"]
-  apiGroups: [""]
-  resources: ["configmaps"]
-  resourceNames: ["kubelet-config"]
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: RoleBinding
-metadata:
-  namespace: kube-system
-  name: kubeadm:kubelet-config
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: Role
-  name: kubeadm:kubelet-config
-subjects:
-- kind: Group
-  apiGroup: rbac.authorization.k8s.io
-  name: system:bootstrappers:aks-flex-node
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRole
-metadata:
-  name: kubeadm:get-nodes
-rules:
-- verbs: ["get"]
-  apiGroups: [""]
-  resources: ["nodes"]
----
-apiVersion: rbac.authorization.k8s.io/v1
-kind: ClusterRoleBinding
-metadata:
-  name: kubeadm:get-nodes
-roleRef:
-  apiGroup: rbac.authorization.k8s.io
-  kind: ClusterRole
-  name: kubeadm:get-nodes
-subjects:
-- kind: Group
-  apiGroup: rbac.authorization.k8s.io
-  name: system:bootstrappers:aks-flex-node
-EOF
-
-  # Publish the ConfigMaps that kubeadm join reads during its preflight phase.
-  # cluster-info goes into kube-public (publicly readable).
-  # kubeadm-config and kubelet-config go into kube-system (bootstrapper-readable).
-  kubectl apply -f - <<EOF
-apiVersion: v1
-kind: ConfigMap
-metadata:
-  namespace: kube-public
-  name: cluster-info
-data:
-  kubeconfig: |
-    apiVersion: v1
-    kind: Config
-    clusters:
-    - cluster:
-        certificate-authority-data: ${ca_cert_data}
-        server: ${server_url}
-      name: ""
-    contexts: []
-    current-context: ""
-    preferences: {}
-    users: []
----
-apiVersion: v1
-kind: ConfigMap
-metadata:
-  namespace: kube-system
-  name: kubeadm-config
-data:
-  ClusterConfiguration: |
-    apiVersion: kubeadm.k8s.io/v1beta4
-    kind: ClusterConfiguration
-    kubernetesVersion: ${E2E_KUBERNETES_VERSION}
-    networking:
-      serviceSubnet: 10.0.0.0/16
----
-apiVersion: v1
-kind: ConfigMap
-metadata:
-  namespace: kube-system
-  name: kubelet-config
-data:
-  kubelet: |
-    apiVersion: kubelet.config.k8s.io/v1beta1
-    kind: KubeletConfiguration
-EOF
-
-  log_success "Bootstrap token and RBAC configured"
-  state_set "kubeadm_bootstrap_token" "${bootstrap_token}"
-
-  # Step 2: Generate the apply -f action file (JSON array of all bootstrap steps
-  #         ending with the KubeadmNodeJoin action)
-  local action_file="${E2E_WORK_DIR}/kubeadm-join.json"
-  cat > "${action_file}" <<EOF
-[
-  {
-    "metadata": {
-      "type": "type.googleapis.com/aks.flex.components.linux.ConfigureBaseOS",
-      "name": "configure-os"
-    },
-    "spec": {}
-  },
-  {
-    "metadata": {
-      "type": "type.googleapis.com/aks.flex.components.cri.DownloadCRIBinaries",
-      "name": "download-cri-binaries"
-    },
-    "spec": {
-      "containerdVersion": "${E2E_CONTAINERD_VERSION}",
-      "runcVersion": "${E2E_RUNC_VERSION}"
-    }
-  },
-  {
-    "metadata": {
-      "type": "type.googleapis.com/aks.flex.components.kubebins.DownloadKubeBinaries",
-      "name": "download-kube-binaries"
-    },
-    "spec": {
-      "kubernetesVersion": "${E2E_KUBERNETES_VERSION}"
-    }
-  },
-  {
-    "metadata": {
-      "type": "type.googleapis.com/aks.flex.components.cni.DownloadCNIBinaries",
-      "name": "download-cni-binaries"
-    },
-    "spec": {}
-  },
-  {
-    "metadata": {
-      "type": "type.googleapis.com/aks.flex.components.cni.ConfigureCNI",
-      "name": "configure-cni"
-    },
-    "spec": {}
-  },
-  {
-    "metadata": {
-      "type": "type.googleapis.com/aks.flex.components.cri.StartContainerdService",
-      "name": "start-containerd"
-    },
-    "spec": {}
-  },
-  {
-    "metadata": {
-      "type": "type.googleapis.com/aks.flex.components.kubeadm.KubeadmNodeJoin",
-      "name": "kubeadm-node-join"
-    },
-    "spec": {
-      "controlPlane": {
-        "server": "${server_url}",
-        "certificateAuthorityData": "${ca_cert_data}"
-      },
-      "kubelet": {
-        "bootstrapAuthInfo": {
-          "token": "${bootstrap_token}"
-        }
-      }
-    }
-  }
-]
-EOF
-
-  # Step 3: Upload binary and action file, then run apply -f directly
-  log_info "Uploading binary and action file to ${vm_ip}..."
-  remote_copy "${E2E_BINARY}" "${vm_ip}" "/tmp/aks-flex-node-binary"
-  remote_copy "${action_file}" "${vm_ip}" "/tmp/kubeadm-join.json"
-
-  log_info "Running kubeadm join via apply -f on ${vm_ip}..."
-  remote_exec "${vm_ip}" 'bash -s' <<REMOTE
-set -euo pipefail
-
-sudo cp /tmp/aks-flex-node-binary /usr/local/bin/aks-flex-node
-sudo chmod +x /usr/local/bin/aks-flex-node
-aks-flex-node version
-
-sudo mkdir -p /etc/aks-flex-node /var/log/aks-flex-node
-sudo cp /tmp/kubeadm-join.json /etc/aks-flex-node/
-
-sudo /usr/local/bin/aks-flex-node apply --no-prettyui -f /etc/aks-flex-node/kubeadm-join.json \
-  2>&1 | sudo tee /var/log/aks-flex-node/aks-flex-node.log
-
-if systemctl is-active --quiet kubelet; then
-  echo "kubelet is running"
-else
-  echo "kubelet status:"
-  systemctl status kubelet --no-pager -l 2>&1 || true
-fi
-REMOTE
-
-  log_success "Kubeadm node joined via apply -f in $(timer_elapsed "${start}")s"
-}
+# shellcheck disable=SC1091
+source "$(dirname "${BASH_SOURCE[0]}")/node-join-msi.sh"
+# shellcheck disable=SC1091
+source "$(dirname "${BASH_SOURCE[0]}")/node-join-token.sh"
+# shellcheck disable=SC1091
+source "$(dirname "${BASH_SOURCE[0]}")/node-join-kubeadm.sh"
 
 # ---------------------------------------------------------------------------
 # node_join_all - Join all nodes in parallel