From 9c8824160415854e2baf1f65e01d8c1338d9587c Mon Sep 17 00:00:00 2001
From: Pablo Trivino
Date: Sun, 3 May 2026 12:30:23 -0700
Subject: [PATCH 1/4] pretest wait

Insert a script step at the top of steps/execute-tests.yml, ahead of the
topology/engine execute template, that logs a message, sleeps for 1200
seconds (20 minutes) and then logs completion.

---
NOTE(review): the wait is unconditional and hard-coded inside this step
template, so every run that includes the template will be delayed by
20 minutes. Confirm that is intended rather than only for the NAP
benchmark stages added later in this series.

 steps/execute-tests.yml | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/steps/execute-tests.yml b/steps/execute-tests.yml
index 84b6e92a2b..ef0c7daf38 100644
--- a/steps/execute-tests.yml
+++ b/steps/execute-tests.yml
@@ -13,6 +13,11 @@ parameters:
   default: {}
 
 steps:
+- script: |
+    echo "Waiting 20 minutes before starting test execution..."
+    sleep 1200 # 20 minutes = 1200 seconds
+    echo "Wait period completed, proceeding with tests"
+  displayName: "Pre-test wait period"
 - template: /steps/topology/${{ parameters.topology }}/execute-${{ parameters.engine }}.yml@self
   parameters:
     cloud: ${{ parameters.cloud }}

From 00d5ac76b08bba8cc50391beac1ce21b9f658475 Mon Sep 17 00:00:00 2001
From: Pablo Trivino
Date: Mon, 4 May 2026 18:26:57 -0400
Subject: [PATCH 2/4] add test with only on-demand

Add the stage azure_australiaeast_small_scale_on_demand to the node
auto-provisioning benchmark. The stage is gated on
Build.Reason == 'Manual', has no stage dependencies, and runs the
competitive-test job template with the karpenter topology and the
clusterloader2 engine (image tag v20250423) in australiaeast.

The single matrix entry, small-scale-on-demand, sets
capacity_type: on-demand with vm_size Standard_D4ds_v4, node_count 10,
pod_count 100, loop_count 5 and a karpenter_cooldown of 900 seconds.

---
 .../node-auto-provisioning-benchmark.yml      | 33 +++++++++++++++++++
 1 file changed, 33 insertions(+)

diff --git a/pipelines/perf-eval/Autoscale Benchmark/node-auto-provisioning-benchmark.yml b/pipelines/perf-eval/Autoscale Benchmark/node-auto-provisioning-benchmark.yml
index d6a6b1630f..64cd0c5612 100644
--- a/pipelines/perf-eval/Autoscale Benchmark/node-auto-provisioning-benchmark.yml
+++ b/pipelines/perf-eval/Autoscale Benchmark/node-auto-provisioning-benchmark.yml
@@ -125,6 +125,39 @@ stages:
           credential_type: service_connection
           ssh_key_enabled: false
 
+  - stage: azure_australiaeast_small_scale_on_demand
+    condition: eq(variables['Build.Reason'], 'Manual')
+    dependsOn: []
+    jobs:
+      - template: /jobs/competitive-test.yml
+        parameters:
+          cloud: azure
+          regions:
+            - australiaeast
+          engine: clusterloader2
+          engine_input:
+            image: "ghcr.io/azure/clusterloader2:v20250423"
+          topology: karpenter
+          matrix:
+            small-scale-on-demand:
+              cpu_per_node: 4
+              node_count: 10
+              pod_count: 100
+              scale_up_timeout: "15m"
+              scale_down_timeout: "15m"
+              node_label_selector: "karpenter.sh/nodepool = default"
+              node_selector: "{karpenter.sh/nodepool: default}"
+              loop_count: 5
+              karpenter_cooldown: 900 #seconds
+              warmup_deployment: true
+              warmup_deployment_template: warmup_deployment.yaml
+              vm_size: Standard_D4ds_v4
+              capacity_type: on-demand
+          max_parallel: 1
+          timeout_in_minutes: 560
+          credential_type: service_connection
+          ssh_key_enabled: false
+
   - stage: azure_australiaeast_small_scale
     condition: |
       or(

From 62196c9ece33d2cfa197be345d9a6d3ba463582a Mon Sep 17 00:00:00 2001
From: Pablo Trivino
Date: Tue, 5 May 2026 17:39:47 -0400
Subject: [PATCH 3/4] add MS workload

Replace the placeholder content of pipelines/system/new-pipeline-test.yml
with a concrete pipeline: SCENARIO_TYPE perf-eval, SCENARIO_NAME
nap-complex, and one stage, azure_canadacentral_ondemand_complex_config,
which pulls in the NAP-MS-CanadaCentral variable group.

The stage runs the competitive-test job template in canadacentral with
the karpenter-private-cluster topology and the clusterloader2 engine
(image tag v20250912). Its single matrix entry, complex-nap, uses
cl2_config_file ms_complex_config.yaml with on-demand capacity.

The file now ends with a trailing newline.

---
 pipelines/system/new-pipeline-test.yml | 52 +++++++++++++++++---------
 1 file changed, 34 insertions(+), 18 deletions(-)

diff --git a/pipelines/system/new-pipeline-test.yml b/pipelines/system/new-pipeline-test.yml
index 63d55f02d9..674c73978a 100644
--- a/pipelines/system/new-pipeline-test.yml
+++ b/pipelines/system/new-pipeline-test.yml
@@ -1,25 +1,41 @@
 trigger: none
-
 variables:
-  SCENARIO_TYPE:
-  SCENARIO_NAME:
+  SCENARIO_TYPE: perf-eval
+  SCENARIO_NAME: nap-complex
 
 stages:
-  - stage: # format: [_]+ (e.g. azure_eastus2, aws_eastus_westus)
+  - stage: azure_canadacentral_ondemand_complex_config
     dependsOn: []
+    variables:
+      - group: NAP-MS-CanadaCentral
     jobs:
-      - template: /jobs/competitive-test.yml # must keep as is
+      - template: /jobs/competitive-test.yml
         parameters:
-          cloud: # e.g. azure, aws
-          regions: # list of regions
-            - region1 # e.g. eastus2
-          topology: # e.g. cluster-autoscaler
-          engine: # e.g. clusterloader2
-          matrix: # list of test parameters to customize the provisioned resources
-            :
-              :
-              :
-          max_parallel: # required
-          credential_type: service_connection # required
-          ssh_key_enabled: false
-          timeout_in_minutes: 60 # if not specified, default is 60
+          cloud: azure
+          regions:
+            - canadacentral
+          engine: clusterloader2
+          engine_input:
+            image: "ghcr.io/azure/clusterloader2:v20250912"
+          topology: karpenter-private-cluster
+          matrix:
+            complex-nap:
+              pod_count: 5000
+              pod_cpu_request: 16
+              pod_memory_request: "60Gi"
+              scale_up_timeout: "900s" # 15 minutes
+              scale_down_timeout: "900s"
+              node_selector: "{karpenter.sh/nodepool: default}"
+              loop_count: 1
+              warmup_deployment: true
+              warmup_deployment_template: warmup_deployment.yaml
+              capacity_type: on-demand
+              cl2_config_file: "ms_complex_config.yaml"
+              enable_prometheus: True
+              scrape_kubelets: True
+              scrape_ksm: True
+              enable_apiserver_vnet_integration: "true"
+          max_parallel: 1
+          timeout_in_minutes: 120
+          credential_type: service_connection
+          ssh_key_enabled: true

From b859dbcc519c4823fb3cdb49e50d66775a56d2fb Mon Sep 17 00:00:00 2001
From: Pablo Trivino
Date: Tue, 5 May 2026 17:45:42 -0400
Subject: [PATCH 4/4] put MS workload with schedule

Add a schedules block to pipelines/system/new-pipeline-test.yml with one
entry: cron "0 21 * * *" on the main branch, with always: true.

Azure Pipelines evaluates schedule cron expressions in UTC, so the
displayName states the timezone explicitly.

---
 pipelines/system/new-pipeline-test.yml | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/pipelines/system/new-pipeline-test.yml b/pipelines/system/new-pipeline-test.yml
index 674c73978a..c2a9360a2d 100644
--- a/pipelines/system/new-pipeline-test.yml
+++ b/pipelines/system/new-pipeline-test.yml
@@ -1,4 +1,12 @@
 trigger: none
+schedules:
+  # canadacentral - daily
+  - cron: "0 21 * * *"
+    displayName: "Every day at 9:00 PM UTC"
+    branches:
+      include:
+        - main
+    always: true
 variables:
   SCENARIO_TYPE: perf-eval
   SCENARIO_NAME: nap-complex