Skip to content

Commit db99097

Browse files
committed
add support for DRAExtendedResources
Signed-off-by: Alay Patel <alayp@nvidia.com>
1 parent 48123e4 commit db99097

File tree

5 files changed

+47
-3
lines changed

5 files changed

+47
-3
lines changed

clusterloader2/pkg/dependency/dra/dra.go

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -70,6 +70,10 @@ func (d *draDependency) Setup(config *dependency.Config) error {
7070
"Namespace": namespace,
7171
"WorkerNodeCount": getWorkerCount(config),
7272
}
73+
74+
if extendedResourceName, ok := config.Params["ExtendedResourceName"]; ok {
75+
mapping["ExtendedResourceName"] = extendedResourceName
76+
}
7377
if err := config.ClusterFramework.ApplyTemplatedManifests(
7478
manifestsFS,
7579
"manifests/*.yaml",
Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,13 @@
11
---
22
# Source: dra-example-driver/templates/deviceclass.yaml
3-
apiVersion: resource.k8s.io/v1beta1
3+
apiVersion: resource.k8s.io/v1
44
kind: DeviceClass
55
metadata:
66
name: gpu.example.com
77
spec:
88
selectors:
99
- cel:
1010
expression: "device.driver == 'gpu.example.com'"
11+
{{- if .ExtendedResourceName}}
12+
extendedResourceName: "{{.ExtendedResourceName}}"
13+
{{- end}}

clusterloader2/testing/dra/config.yaml

Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,8 +23,15 @@
2323
{{$smallJobSize := 1}}
2424
{{$smallJobCompletions := 10}}
2525
{{$jobRunningTime := DefaultParam .CL2_JOB_RUNNING_TIME "30s"}}
26+
{{$ENABLE_EXTENDED_RESOURCES := DefaultParam .CL2_ENABLE_EXTENDED_RESOURCES false}}
2627

28+
{{$extendedResourceName := ""}}
29+
{{if $ENABLE_EXTENDED_RESOURCES}}
30+
{{$extendedResourceName = DefaultParam .CL2_EXTENDED_RESOURCE_NAME "example.com/gpu"}}
31+
name: dra-extended-resources-steady-state
32+
{{else}}
2733
name: dra-steady-state
34+
{{end}}
2835

2936
namespace:
3037
number: {{$namespaces}}
@@ -37,11 +44,15 @@ tuningSets:
3744
qpsLoad:
3845
qps: {{$STEADY_STATE_QPS}}
3946

47+
4048
dependencies:
4149
- name: Install dra-example-driver for test
4250
Method: DRATestDriver
4351
Params:
4452
WorkerNodeCount: {{.Nodes}}
53+
{{if $ENABLE_EXTENDED_RESOURCES}}
54+
ExtendedResourceName: {{$extendedResourceName}}
55+
{{end}}
4556
Timeout: 5m
4657

4758
steps:
@@ -89,6 +100,7 @@ steps:
89100
query: histogram_quantile(0.99, sum(rate(dra_grpc_operations_duration_seconds_bucket{method_name=~".*NodePrepareResources"}[%v])) by (le))
90101
- name: p99_dra_grpc_node_unprepare_resources
91102
query: histogram_quantile(0.99, sum(rate(dra_grpc_operations_duration_seconds_bucket{method_name=~".*NodeUnprepareResources"}[%v])) by (le))
103+
{{if not $ENABLE_EXTENDED_RESOURCES}}
92104
- name: Create ResourceClaimTemplates in namespaces
93105
phases:
94106
- namespaceRange:
@@ -99,6 +111,7 @@ steps:
99111
objectBundle:
100112
- basename: single-gpu
101113
objectTemplatePath: "resourceclaimtemplate.yaml"
114+
{{end}}
102115
- name: Fill cluster to {{$fillPercentage}}% utilization
103116
phases:
104117
- namespaceRange:
@@ -113,6 +126,11 @@ steps:
113126
Replicas: {{$longJobSize}}
114127
Mode: {{$MODE}}
115128
Sleep: {{$longJobRunningTime}}
129+
{{if $ENABLE_EXTENDED_RESOURCES}}
130+
ExtendedResource: {{ true }}
131+
{{else}}
132+
ExtendedResource: {{ false }}
133+
{{end}}
116134
- name: Wait for fill pods to be running
117135
measurements:
118136
- Identifier: WaitForControlledPodsRunning
@@ -188,6 +206,11 @@ steps:
188206
CompletionReplicas: {{$smallJobCompletions}}
189207
Mode: {{$MODE}}
190208
Sleep: {{$jobRunningTime}}
209+
{{if $ENABLE_EXTENDED_RESOURCES}}
210+
ExtendedResource: {{ true }}
211+
{{else}}
212+
ExtendedResource: {{ false }}
213+
{{end}}
191214
- name: Wait for short-lived jobs to finish
192215
measurements:
193216
- Identifier: WaitForFinishedJobs

clusterloader2/testing/dra/job.yaml

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -23,8 +23,15 @@ spec:
2323
args:
2424
- {{.Sleep}}
2525
resources:
26+
{{ if not .ExtendedResource }}
2627
claims:
2728
- name: gpu
29+
{{ else }}
30+
limits:
31+
example.com/gpu: "1"
32+
{{ end }}
33+
{{ if not .ExtendedResource }}
2834
resourceClaims:
2935
- name: gpu
30-
resourceClaimTemplateName: single-gpu-0
36+
resourceClaimTemplateName: single-gpu-0
37+
{{ end }}

clusterloader2/testing/dra/long-running-job.yaml

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -23,8 +23,15 @@ spec:
2323
args:
2424
- {{.Sleep}}
2525
resources:
26+
{{ if not .ExtendedResource }}
2627
claims:
2728
- name: gpu
29+
{{ else }}
30+
limits:
31+
example.com/gpu: "1"
32+
{{ end }}
33+
{{ if not .ExtendedResource }}
2834
resourceClaims:
2935
- name: gpu
30-
resourceClaimTemplateName: single-gpu-0
36+
resourceClaimTemplateName: single-gpu-0
37+
{{ end }}

0 commit comments

Comments
 (0)