Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -407,3 +407,220 @@ periodics:
value: "gcr.io/k8s-staging-perf-tests/sleep:v0.0.3"
- name: CL2_ENABLE_EXTENDED_RESOURCES
value: "true"

# Periodic kops-on-GCE scalability job: per its description it runs
# k8s.io/perf-tests/run-e2e.sh against a 100-node cluster with DRA enabled.
- name: ci-kubernetes-e2e-kops-gce-100-node-dra-with-workload-ipalias-using-cl2
tags:
- "perfDashPrefix: gce-dra-100Nodes-with-workload-dev"
- "perfDashBuildsCount: 270"
- "perfDashJobType: performance"
cluster: k8s-infra-prow-build
# Triggered on a fixed 4-hour interval.
interval: 4h
labels:
preset-k8s-ssh: "true"
preset-dind-enabled: "true"
decorate: true
decoration_config:
# 480m = 8h.
timeout: 480m
# Three repositories are referenced: kubernetes, perf-tests and kops (all at master).
# NOTE(review): `workdir: true` presumably belongs to the kops ref, matching the
# relative ./tests/e2e/... script path in `args` — indentation is not visible here; confirm.
extra_refs:
- org: kubernetes
repo: kubernetes
base_ref: master
path_alias: k8s.io/kubernetes
- org: kubernetes
repo: perf-tests
base_ref: master
path_alias: k8s.io/perf-tests
- org: kubernetes
repo: kops
base_ref: master
path_alias: k8s.io/kops
workdir: true
annotations:
test.kops.k8s.io/cloud: gce
test.kops.k8s.io/distro: u2404
test.kops.k8s.io/k8s_version: stable
test.kops.k8s.io/kops_channel: alpha
test.kops.k8s.io/networking: ipalias
testgrid-dashboards: kops-misc, sig-cluster-lifecycle-kops, sig-scalability-gce, sig-scalability-dra
testgrid-tab-name: gce-dra-with-workload-master-scalability-100-canary
description: "Uses kops to run k8s.io/perf-tests/run-e2e.sh against a 100-node cluster with DRA enabled"
spec:
serviceAccountName: prow-build
containers:
- image: us-central1-docker.pkg.dev/k8s-staging-test-infra/images/kubekins-e2e:v20250925-95b5a2c7a5-master
imagePullPolicy: Always
command:
- runner.sh
args:
- ./tests/e2e/scenarios/scalability/run-test.sh
# The container runs privileged.
securityContext:
privileged: true
# Environment passed to the scalability scenario script. Numeric and boolean-looking
# values are quoted so they are read as strings.
env:
- name: KUBE_SSH_KEY_PATH
value: /etc/ssh-key-secret/ssh-private
- name: KUBE_SSH_USER
value: ubuntu
- name: GOPATH
value: /home/prow/go
- name: ARTIFACTS
value: $(ARTIFACTS)
- name: CNI_PLUGIN
value: gce
- name: KUBE_NODE_COUNT
value: "100"
- name: CL2_MODE
value: "Indexed"
- name: CL2_NODES_PER_NAMESPACE
value: "10"
- name: CL2_JOB_RUNNING_TIME
value: "3s"
- name: CL2_LONG_JOB_RUNNING_TIME
value: "45m"
- name: CL2_EXTENDED_RESOURCE_NAME
value: "example.com/gpu"
# The two throughput overrides below are commented out, i.e. not set for this job.
# - name: CL2_LOAD_TEST_THROUGHPUT
# value: "50"
# - name: CL2_DELETE_TEST_THROUGHPUT
# value: "50"
- name: CL2_RATE_LIMIT_POD_CREATION
value: "false"
- name: NODE_MODE
value: "master"
# A single control-plane instance of size c4-standard-96.
- name: CONTROL_PLANE_COUNT
value: "1"
- name: CONTROL_PLANE_SIZE
value: "c4-standard-96"
- name: KUBE_PROXY_MODE
value: "nftables"
- name: ENABLE_PROMETHEUS_SERVER
value: "true"
- name: PROMETHEUS_SCRAPE_KUBELETS
value: "true"
- name: PROMETHEUS_PVC_STORAGE_CLASS
value: "ssd-csi"
- name: CLOUD_PROVIDER
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

The DRA test also requires enabling certain feature flags. The config above sets this:

            - --env=KUBE_FEATURE_GATES=DynamicResourceAllocation=true

In the case of kops, should we set KOPS_FEATURE_FLAGS to enable the same feature as above?

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

The DRA feature should already be auto-enabled: kops enables all GA/Beta flags by default.

value: "gce"
# Remaining env entries of the 100-node DRA job, followed by its resource settings.
- name: BOSKOS_RESOURCE_TYPE
value: "scalability-project"
- name: NODE_PRELOAD_IMAGES
value: "gcr.io/k8s-staging-perf-tests/sleep:v0.0.3"
# Test config path is relative: testing/dra/config.yaml.
- name: KOPS_CL2_TEST_CONFIG
value: testing/dra/config.yaml
- name: CL2_ENABLE_EXTENDED_RESOURCES
value: "true"
# Requests and limits are identical (7 CPU, 28Gi memory).
resources:
requests:
cpu: "7"
memory: "28Gi"
limits:
cpu: "7"
memory: "28Gi"

# Periodic kops-on-GCE scalability job: per its description it runs
# k8s.io/perf-tests/run-e2e.sh against a 5000-node cluster with DRA enabled.
- name: ci-kubernetes-e2e-kops-gce-5000-node-dra-with-workload-ipalias-using-cl2
tags:
- "perfDashPrefix: gce-dra-5000Nodes-with-workload"
- "perfDashBuildsCount: 270"
- "perfDashJobType: performance"
cluster: k8s-infra-prow-build
cron: '0 3 * * *' # Run once a day at 03:00 UTC
labels:
preset-k8s-ssh: "true"
preset-dind-enabled: "true"
# Uses the '5k-gce-scale-test' queue; config/prow/config.yaml sets that queue to 1
# under the comment "limits concurrency for 5k GCE jobs".
job_queue_name: "5k-gce-scale-test" # DON'T REMOVE THIS
decorate: true
decoration_config:
# 480m = 8h.
timeout: 480m
# Three repositories are referenced: kubernetes, perf-tests and kops (all at master).
# NOTE(review): `workdir: true` presumably belongs to the kops ref, matching the
# relative ./tests/e2e/... script path in `args` — indentation is not visible here; confirm.
extra_refs:
- org: kubernetes
repo: kubernetes
base_ref: master
path_alias: k8s.io/kubernetes
- org: kubernetes
repo: perf-tests
base_ref: master
path_alias: k8s.io/perf-tests
- org: kubernetes
repo: kops
base_ref: master
path_alias: k8s.io/kops
workdir: true
annotations:
test.kops.k8s.io/cloud: gce
test.kops.k8s.io/distro: u2404
test.kops.k8s.io/k8s_version: stable
test.kops.k8s.io/kops_channel: alpha
test.kops.k8s.io/networking: ipalias
testgrid-dashboards: kops-misc, sig-cluster-lifecycle-kops, sig-scalability-gce, sig-scalability-dra
testgrid-tab-name: gce-dra-with-workload-master-scalability-5000
# Unlike the 100-node job, this one sets TestGrid alerting: two addresses and a
# failure threshold of 2 (quoted, so it is a string).
testgrid-alert-email: kubernetes-sig-scale@googlegroups.com, kubernetes-scalability-tickets@google.com
testgrid-num-failures-to-alert: '2'
description: "Uses kops to run k8s.io/perf-tests/run-e2e.sh against a 5000-node cluster with DRA enabled"
spec:
serviceAccountName: prow-build
containers:
- image: us-central1-docker.pkg.dev/k8s-staging-test-infra/images/kubekins-e2e:v20250925-95b5a2c7a5-master
imagePullPolicy: Always
command:
- runner.sh
args:
- ./tests/e2e/scenarios/scalability/run-test.sh
# The container runs privileged.
securityContext:
privileged: true
# Environment passed to the scalability scenario script. Numeric and boolean-looking
# values are quoted so they are read as strings.
env:
- name: KUBE_SSH_KEY_PATH
value: /etc/ssh-key-secret/ssh-private
- name: KUBE_SSH_USER
value: ubuntu
- name: GOPATH
value: /home/prow/go
- name: ARTIFACTS
value: $(ARTIFACTS)
- name: CNI_PLUGIN
value: gce
- name: KUBE_NODE_COUNT
value: "5000"
- name: CL2_MODE
value: "Indexed"
- name: CL2_NODES_PER_NAMESPACE
value: "2500"
- name: CL2_JOB_RUNNING_TIME
value: "3s"
- name: CL2_LONG_JOB_RUNNING_TIME
value: "240m"
# NOTE(review): the 100-node DRA job sets CL2_EXTENDED_RESOURCE_NAME to
# "example.com/gpu" at this position; it is not set here. Confirm whether the
# omission is intended or the test config's default is being relied on.
# The two throughput overrides below are commented out, i.e. not set for this job.
# - name: CL2_LOAD_TEST_THROUGHPUT
# value: "50"
# - name: CL2_DELETE_TEST_THROUGHPUT
# value: "50"
- name: CL2_RATE_LIMIT_POD_CREATION
value: "false"
- name: NODE_MODE
value: "master"
# A single control-plane instance of size c4-standard-96.
- name: CONTROL_PLANE_COUNT
value: "1"
- name: CONTROL_PLANE_SIZE
value: "c4-standard-96"
- name: KUBE_PROXY_MODE
value: "nftables"
- name: ENABLE_PROMETHEUS_SERVER
value: "true"
- name: PROMETHEUS_SCRAPE_KUBELETS
value: "true"
- name: PROMETHEUS_PVC_STORAGE_CLASS
value: "ssd-csi"
- name: CLOUD_PROVIDER
value: "gce"
# The 100-node job uses "scalability-project" here; this job uses a different type.
- name: BOSKOS_RESOURCE_TYPE
value: "scalability-scale-project"
- name: NODE_PRELOAD_IMAGES
value: "gcr.io/k8s-staging-perf-tests/sleep:v0.0.3"
- name: CL2_ENABLE_EXTENDED_RESOURCES
value: "true"
# Test config path is relative: testing/dra/config.yaml.
- name: KOPS_CL2_TEST_CONFIG
value: testing/dra/config.yaml
# Requests and limits are identical (7 CPU, 28Gi memory).
resources:
requests:
cpu: "7"
memory: "28Gi"
limits:
cpu: "7"
memory: "28Gi"
Original file line number Diff line number Diff line change
Expand Up @@ -1181,6 +1181,7 @@ periodics:
preset-e2e-scalability-common: "true"
preset-e2e-scalability-periodics: "true"
preset-e2e-scalability-periodics-master: "true"
job_queue_name: "5k-gce-scale-test" # DON'T REMOVE THIS
decorate: true
decoration_config:
timeout: 450m
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,7 @@ periodics:
preset-e2e-scalability-periodics: "true"
preset-e2e-scalability-periodics-master: "true"
decorate: true
job_queue_name: "5k-gce-scale-test" # DON'T REMOVE THIS
decoration_config:
timeout: 270m
annotations:
Expand Down Expand Up @@ -85,6 +86,7 @@ periodics:
preset-e2e-scalability-periodics: "true"
preset-e2e-scalability-periodics-master: "true"
decorate: true
job_queue_name: "5k-gce-scale-test" # DON'T REMOVE THIS
decoration_config:
timeout: 450m
extra_refs:
Expand Down
2 changes: 2 additions & 0 deletions config/prow/config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,8 @@ plank:
'k8sio-image-promo': 1
# limits concurrency for k8s-test-infra-staging project
'test-infra-staging-image-push': 1
# limits concurrency for 5k GCE jobs
'5k-gce-scale-test': 1
default_decoration_config_entries:
- config:
timeout: 2h
Expand Down