Skip to content

Commit 34b78d9

Browse files
committed
add 5000 node dra test
Signed-off-by: Alay Patel <[email protected]>
1 parent c596351 commit 34b78d9

File tree

1 file changed

+96
-0
lines changed

1 file changed

+96
-0
lines changed

config/jobs/kubernetes/sig-scalability/DRA/sig-scalability-periodic-dra.yaml

Lines changed: 96 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -405,3 +405,99 @@ periodics:
405405
value: "true"
406406
- name: NODE_PRELOAD_IMAGES
407407
value: "gcr.io/k8s-staging-perf-tests/sleep:v0.0.3"
408+
409+
- name: ci-kubernetes-e2e-gce-5000-node-dra-with-workload
410+
cluster: k8s-infra-prow-build
411+
tags:
412+
- "perfDashPrefix: gce-dra-5000Nodes-with-workload"
413+
- "perfDashBuildsCount: 270"
414+
- "perfDashJobType: performance"
415+
# Run on even days at 17:01 UTC (9:01 PST) to complement the release-blocking test that runs on odd days
416+
# The release-blocking test runs on odd days at 17:01 UTC (9:01 PST)
417+
cron: '1 17 2-30/2 * *'
418+
labels:
419+
preset-service-account: "true"
420+
preset-k8s-ssh: "true"
421+
preset-e2e-scalability-common: "true"
422+
preset-e2e-scalability-periodics: "true"
423+
preset-e2e-scalability-periodics-master: "true"
424+
annotations:
425+
testgrid-dashboards: sig-scalability-dra
426+
testgrid-tab-name: gce-dra-with-workload-master-scalability-5000
427+
testgrid-alert-email: [email protected], [email protected]
428+
testgrid-num-failures-to-alert: '2'
429+
description: "Uses kubetest to run k8s.io/perf-tests/run-e2e.sh against a 5000-node cluster with DRA enabled"
430+
decorate: true
431+
decoration_config:
432+
timeout: 8h
433+
extra_refs:
434+
- org: kubernetes
435+
repo: kubernetes
436+
base_ref: master
437+
path_alias: k8s.io/kubernetes
438+
- org: kubernetes
439+
repo: perf-tests
440+
base_ref: master
441+
path_alias: k8s.io/perf-tests
442+
spec:
443+
containers:
444+
- image: gcr.io/k8s-staging-test-infra/kubekins-e2e:v20250925-95b5a2c7a5-master
445+
command:
446+
- runner.sh
447+
- /workspace/scenarios/kubernetes_e2e.py
448+
args:
449+
- --cluster=gce-scale-cluster
450+
- --env=HEAPSTER_MACHINE_TYPE=e2-standard-32
451+
# TODO(mborsz): Adjust or remove this change once we understand coredns
452+
# memory usage regression.
453+
- --env=KUBE_DNS_MEMORY_LIMIT=300Mi
454+
- --extract=ci/fast/latest-fast
455+
- --gcp-nodes=5000
456+
- --gcp-project-type=scalability-scale-project
457+
- --gcp-zone=us-east1-b
458+
- --provider=gce
459+
- --metadata-sources=cl2-metadata.json
460+
- --env=KUBE_FEATURE_GATES=DynamicResourceAllocation=true
461+
- --runtime-config=api/all=true
462+
- --test=false
463+
- --test-cmd=$GOPATH/src/k8s.io/perf-tests/run-e2e.sh
464+
- --test-cmd-args=cluster-loader2
465+
- --test-cmd-args=--nodes=5000
466+
- --test-cmd-args=--provider=gce
467+
- --test-cmd-args=--enable-prometheus-server=true
468+
- --test-cmd-args=--prometheus-scrape-node-exporter
469+
- --test-cmd-args=--experimental-gcp-snapshot-prometheus-disk=true
470+
- --test-cmd-args=--experimental-prometheus-disk-snapshot-name=$(JOB_NAME)-$(BUILD_ID)
471+
- --test-cmd-args=--experimental-prometheus-snapshot-to-report-dir=true
472+
- --test-cmd-args=--testconfig=testing/dra/config.yaml
473+
- --test-cmd-args=--report-dir=$(ARTIFACTS)
474+
- --test-cmd-args=--testoverrides=./testing/overrides/5000_nodes.yaml
475+
- --test-cmd-name=ClusterLoaderV2
476+
- --timeout=420m
477+
- --use-logexporter
478+
- --logexporter-gcs-path=gs://k8s-infra-scalability-tests-logs/$(JOB_NAME)/$(BUILD_ID)
479+
resources:
480+
requests:
481+
cpu: 6
482+
memory: "16Gi"
483+
limits:
484+
cpu: 6
485+
memory: "16Gi"
486+
env:
487+
- name: CL2_MODE
488+
value: "Indexed"
489+
- name: CL2_NODES_PER_NAMESPACE
490+
value: "2500"
491+
- name: CL2_JOB_RUNNING_TIME
492+
value: "3s"
493+
- name: CL2_LONG_JOB_RUNNING_TIME
494+
value: "240m"
495+
# TODO: the 100-node GCE test runs with the two settings below at 10 and 5; they can be increased here if needed
496+
# - name: CL2_LOAD_TEST_THROUGHPUT
497+
# value: "50"
498+
# - name: CL2_STEADY_STATE_QPS
499+
# value: "25"
500+
- name: PROMETHEUS_SCRAPE_KUBELETS
501+
value: "true"
502+
- name: NODE_PRELOAD_IMAGES
503+
value: "gcr.io/k8s-staging-perf-tests/sleep:v0.0.3"

0 commit comments

Comments
 (0)