Azure · FumingZhang · May 6, 2024 · Apr 30, 2024 · Apr 30, 2024 · May 1, 2024
diff --git a/cSpell.json b/cSpell.json
@@ -188,7 +188,10 @@
             "words": [
                 "vtpm",
                 "trustedlaunch",
-                "aksadvancednetworking"
+                "aksadvancednetworking",
+                "PDBs",
+                "undrainable",
+                "Undrainable"
             ]
         },
         {

diff --git a/...ce-manager/Microsoft.ContainerService/aks/preview/2024-04-02-preview/managedClusters.json b/...ce-manager/Microsoft.ContainerService/aks/preview/2024-04-02-preview/managedClusters.json
@@ -4728,6 +4728,28 @@
           "minimum": 0,
           "title": "The soak duration for a node",
           "description": "The amount of time (in minutes) to wait after draining a node and before reimaging it and moving on to next node. If not specified, the default is 0 minutes."
+        },
+        "undrainableNodeBehavior": {
+          "type": "string",
+          "description": "Defines the behavior for undrainable nodes during upgrade. The most common cause of undrainable nodes is Pod Disruption Budgets (PDBs), but other issues, such as a pod's termination grace period exceeding the remaining per-node drain timeout or a pod still being in a running state, can also cause undrainable nodes.",
+          "enum": [
+            "Schedule",
+            "Cordon"
+          ],
+          "x-ms-enum": {
+            "name": "UndrainableNodeBehavior",
+            "modelAsString": true,
+            "values": [
+              {
+                "value": "Cordon",
+                "description": "AKS will cordon the blocked nodes and replace them with surge nodes during upgrade. The blocked nodes will have the label 'kubernetes.azure.com/upgrade-status:Quarantined'. A surge node will be retained for each blocked node. A best-effort attempt will be made to delete all other surge nodes. If there are enough surge nodes to replace the blocked nodes, then the upgrade operation and the managed cluster will be in a failed state. Otherwise, the upgrade operation and the managed cluster will be in a canceled state."
+              },
+              {
+                "value": "Schedule",
+                "description": "AKS will mark the blocked nodes schedulable, but the blocked nodes are not upgraded. A best-effort attempt will be made to delete all surge nodes. The upgrade operation and the managed cluster will be in a failed state if there are any blocked nodes."
+              }
+            ]
+          }
         }
       },
       "description": "Settings for upgrading an agentpool"