Skip to content

Commit f737d3c

Browse files
committed
add support for DRAExtendedResources
Signed-off-by: Alay Patel <[email protected]>
1 parent 48123e4 commit f737d3c

File tree

5 files changed, with 36 additions and 4 deletions.

clusterloader2/pkg/dependency/dra/dra.go

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -70,6 +70,10 @@ func (d *draDependency) Setup(config *dependency.Config) error {
7070
"Namespace": namespace,
7171
"WorkerNodeCount": getWorkerCount(config),
7272
}
73+
74+
if extendedResourceName, ok := config.Params["ExtendedResourceName"]; ok {
75+
mapping["ExtendedResourceName"] = extendedResourceName
76+
}
7377
if err := config.ClusterFramework.ApplyTemplatedManifests(
7478
manifestsFS,
7579
"manifests/*.yaml",
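
(file path not captured in this extract — a DeviceClass manifest, presumably one of the templates under clusterloader2/pkg/dependency/dra/manifests/)

Lines changed: 4 additions & 1 deletion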
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,13 @@
11
---
22
# Source: dra-example-driver/templates/deviceclass.yaml
3-
apiVersion: resource.k8s.io/v1beta1
3+
apiVersion: resource.k8s.io/v1
44
kind: DeviceClass
55
metadata:
66
name: gpu.example.com
77
spec:
88
selectors:
99
- cel:
1010
expression: "device.driver == 'gpu.example.com'"
11+
{{- if .ExtendedResourceName}}
12+
extendedResourceName: "{{.ExtendedResourceName}}"
13+
{{- end}}

clusterloader2/testing/dra/config.yaml

Lines changed: 16 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -23,8 +23,15 @@
2323
{{$smallJobSize := 1}}
2424
{{$smallJobCompletions := 10}}
2525
{{$jobRunningTime := DefaultParam .CL2_JOB_RUNNING_TIME "30s"}}
26+
{{$ENABLE_EXTENDED_RESOURCES := DefaultParam .CL2_ENABLE_EXTENDED_RESOURCES false}}
2627

28+
{{$extendedResourceName := ""}}
29+
{{if $ENABLE_EXTENDED_RESOURCES}}
30+
{{$extendedResourceName = DefaultParam .CL2_EXTENDED_RESOURCE_NAME "example.com/gpu"}}
31+
name: dra-extended-resources-steady-state
32+
{{else}}
2733
name: dra-steady-state
34+
{{end}}
2835

2936
namespace:
3037
number: {{$namespaces}}
@@ -37,11 +44,15 @@ tuningSets:
3744
qpsLoad:
3845
qps: {{$STEADY_STATE_QPS}}
3946

47+
4048
dependencies:
4149
- name: Install dra-example-driver for test
4250
Method: DRATestDriver
4351
Params:
4452
WorkerNodeCount: {{.Nodes}}
53+
{{if $ENABLE_EXTENDED_RESOURCES}}
54+
ExtendedResourceName: {{$extendedResourceName}}
55+
{{end}}
4556
Timeout: 5m
4657

4758
steps:
@@ -89,6 +100,7 @@ steps:
89100
query: histogram_quantile(0.99, sum(rate(dra_grpc_operations_duration_seconds_bucket{method_name=~".*NodePrepareResources"}[%v])) by (le))
90101
- name: p99_dra_grpc_node_unprepare_resources
91102
query: histogram_quantile(0.99, sum(rate(dra_grpc_operations_duration_seconds_bucket{method_name=~".*NodeUnprepareResources"}[%v])) by (le))
103+
{{if not $ENABLE_EXTENDED_RESOURCES}}
92104
- name: Create ResourceClaimTemplates in namespaces
93105
phases:
94106
- namespaceRange:
@@ -99,6 +111,7 @@ steps:
99111
objectBundle:
100112
- basename: single-gpu
101113
objectTemplatePath: "resourceclaimtemplate.yaml"
114+
{{end}}
102115
- name: Fill cluster to {{$fillPercentage}}% utilization
103116
phases:
104117
- namespaceRange:
@@ -113,6 +126,7 @@ steps:
113126
Replicas: {{$longJobSize}}
114127
Mode: {{$MODE}}
115128
Sleep: {{$longJobRunningTime}}
129+
ExtendedResource: {{ $ENABLE_EXTENDED_RESOURCES }}
116130
- name: Wait for fill pods to be running
117131
measurements:
118132
- Identifier: WaitForControlledPodsRunning
@@ -188,6 +202,7 @@ steps:
188202
CompletionReplicas: {{$smallJobCompletions}}
189203
Mode: {{$MODE}}
190204
Sleep: {{$jobRunningTime}}
205+
ExtendedResource: {{ $ENABLE_EXTENDED_RESOURCES }}
191206
- name: Wait for short-lived jobs to finish
192207
measurements:
193208
- Identifier: WaitForFinishedJobs
@@ -216,4 +231,4 @@ steps:
216231
- Identifier: ChurnDRAMetrics
217232
Method: GenericPrometheusQuery
218233
Params:
219-
action: gather
234+
action: gather

clusterloader2/testing/dra/job.yaml

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -23,8 +23,13 @@ spec:
2323
args:
2424
- {{.Sleep}}
2525
resources:
26+
{{ if .ExtendedResource }}
27+
limits:
28+
example.com/gpu: "1"
29+
{{ else }}
2630
claims:
2731
- name: gpu
2832
resourceClaims:
2933
- name: gpu
30-
resourceClaimTemplateName: single-gpu-0
34+
resourceClaimTemplateName: single-gpu-0
35+
{{ end }}

clusterloader2/testing/dra/long-running-job.yaml

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -23,8 +23,13 @@ spec:
2323
args:
2424
- {{.Sleep}}
2525
resources:
26+
{{ if .ExtendedResource }}
27+
limits:
28+
example.com/gpu: "1"
29+
{{ else }}
2630
claims:
2731
- name: gpu
2832
resourceClaims:
2933
- name: gpu
30-
resourceClaimTemplateName: single-gpu-0
34+
resourceClaimTemplateName: single-gpu-0
35+
{{ end }}

0 commit comments

Comments
 (0)