Azure · awesomenix · Mar 10, 2026 · Copilot · Mar 24, 2026 · Copilot
@@ -20,7 +20,10 @@ set -euo pipefail
 
 logger -t aks-boothook "boothook start $(date -Ins)"
 
-mkdir -p /opt/azure/containers
+mkdir -p /opt/azure/containers /var/lib/waagent
+
+touch /var/lib/waagent/experimental_skip_ready_report
+chmod 0644 /var/lib/waagent/experimental_skip_ready_report
 
 cat <<'EOF' | base64 -d >/opt/azure/containers/aks-node-controller-config.json
 %s

@@ -506,8 +506,9 @@ func Test_Ubuntu2204_Scriptless(t *testing.T) {
 	RunScenario(t, &Scenario{
 		Description: "tests that a new ubuntu 2204 node using self contained installer can be properly bootstrapped",
 		Config: Config{
-			Cluster: ClusterKubenet,
-			VHD:     config.VHDUbuntu2204Gen2Containerd,
+			Cluster:                       ClusterKubenet,
+			VHD:                           config.VHDUbuntu2204Gen2Containerd,
+			UseCustomDataOnlyProvisioning: true,
 			Validator: func(ctx context.Context, s *Scenario) {
 				ValidateFileHasContent(ctx, s, "/var/log/azure/aks-node-controller.log", "aks-node-controller finished successfully")
 			},

@@ -301,8 +301,10 @@ func prepareAKSNode(ctx context.Context, s *Scenario) (*ScenarioVM, error) {
 		require.NoError(s.T, err, "create vmss %q, check %s for vm logs", s.Runtime.VMSSName, testDir(s.T))
 	}
 
-	err = getCustomScriptExtensionStatus(s, scenarioVM.VM)
-	require.NoError(s.T, err)
+	if !s.Config.UseCustomDataOnlyProvisioning {
+		err = getCustomScriptExtensionStatus(s, scenarioVM.VM)
+		require.NoError(s.T, err)
+	}
 
 	if !s.Config.SkipDefaultValidation {
 		vmssCreatedAt := time.Now()         // Record the start time

@@ -163,6 +163,11 @@ type Config struct {
 	// AKSNodeConfigMutator if defined then aks-node-controller will be used to provision nodes
 	AKSNodeConfigMutator func(*aksnodeconfigv1.Configuration)
 
+	// UseCustomDataOnlyProvisioning switches an AKSNodeConfig scenario to a CustomData-only E2E flow.
+	// It omits the VMSS Custom Script Extension and uses CustomData to run aks-node-controller provision
+	// directly during cloud-init instead.
+	UseCustomDataOnlyProvisioning bool
+
 	// VMConfigMutator is a function which mutates the base VMSS model according to the scenario's requirements
 	VMConfigMutator func(*armcompute.VirtualMachineScaleSet)
 

@@ -95,7 +95,10 @@ func CustomDataWithHack(s *Scenario, binaryURL string) (string, error) {
 #!/bin/bash
 set -euo pipefail
 
-mkdir -p /opt/azure/containers /opt/azure/bin
+mkdir -p /opt/azure/containers /opt/azure/bin /var/lib/waagent
+
+touch /var/lib/waagent/experimental_skip_ready_report
+chmod 0644 /var/lib/waagent/experimental_skip_ready_report
 
 cat <<'EOF' | base64 -d > /opt/azure/containers/aks-node-controller-config-hack.json
 %s

@@ -872,4 +872,13 @@ EOF
     systemctl restart nvidia-persistenced.service || exit 1
 }
 
+# skipCloudInitReadyReport writes a cloud-init drop-in that sets
+# datasource.Azure.experimental_skip_ready_report to true, then creates the
+# marker file under /var/lib/waagent. Takes no arguments.
+skipCloudInitReadyReport() {
+    local config_filepath="/etc/cloud/cloud.cfg.d/81_azure_skip_ready_report.cfg"
+    mkdir -p "$(dirname "${config_filepath}")"
+    cat <<EOF >"${config_filepath}"
+datasource:
+    Azure:
+        experimental_skip_ready_report: true
+EOF
+
+    # Ensure the marker file used by report_ready.py is present so that
+    # disabling the cloud-init ready report still allows the standalone
+    # reporting script to run as expected.
+    mkdir -p /var/lib/waagent
+    touch /var/lib/waagent/experimental_skip_ready_report
+}
 #EOF
@@ -103,6 +103,15 @@ EVENT_JSON=$( jq -n \
 )
 echo ${EVENT_JSON} > ${EVENTS_LOGGING_DIR}${EVENTS_FILE_NAME}.json
 
+
+# Report the provisioning result through report_ready.py when the script is
+# installed and executable; a failed report only logs a warning.
+if [ -x /opt/azure/containers/report_ready.py ]; then
+    if [ "$EXIT_CODE" -eq 0 ]; then
+        # The trailing '&' backgrounds the whole '||' list, so the warning is
+        # still printed if the backgrounded report fails.
+        python3 /opt/azure/containers/report_ready.py -v || echo "WARNING: Failed to report ready to Azure fabric" &
+    else
+        # Failure is reported in the foreground, with the exit code and message.
+        python3 /opt/azure/containers/report_ready.py -v --failure --description "ExitCode: ${EXIT_CODE}, ${message_string}" || echo "WARNING: Failed to report failure to Azure fabric"
+    fi
+fi
+
 # force a log upload to the host after the provisioning script finishes
 # if we failed, wait for the upload to complete so that we don't remove
 # the VM before it finishes. if we succeeded, upload in the background