From a9ac858b711803afd362b10a4dde0505708efef4 Mon Sep 17 00:00:00 2001
From: Kevin Hannon
Date: Tue, 3 Sep 2024 14:07:28 -0400
Subject: [PATCH 1/4] Kueue and DRA support

---
 keps/2941-DRA-Structured-Parameters/README.md | 394 ++++++++++++++++++
 .../examples/gpu-test1/gpu-test1.yaml         |  46 ++
 .../gpu-test1/single-clusterqueue-setup.yaml  |  32 ++
 keps/2941-DRA-Structured-Parameters/kep.yaml  |  42 ++
 4 files changed, 514 insertions(+)
 create mode 100644 keps/2941-DRA-Structured-Parameters/README.md
 create mode 100644 keps/2941-DRA-Structured-Parameters/examples/gpu-test1/gpu-test1.yaml
 create mode 100644 keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml
 create mode 100644 keps/2941-DRA-Structured-Parameters/kep.yaml

diff --git a/keps/2941-DRA-Structured-Parameters/README.md b/keps/2941-DRA-Structured-Parameters/README.md
new file mode 100644
index 0000000000..953777fc07
--- /dev/null
+++ b/keps/2941-DRA-Structured-Parameters/README.md
@@ -0,0 +1,394 @@
+# KEP-2941: Structured Parameters
+
+- [Summary](#summary)
+- [Motivation](#motivation)
+  - [Background](#background)
+    - [DRA Example](#dra-example)
+    - [Workload Example](#workload-example)
+    - [Example Driver Cluster Resources](#example-driver-cluster-resources)
+      - [Resource slices](#resource-slices)
+      - [Device classes](#device-classes)
+  - [Goals](#goals)
+  - [Non-Goals](#non-goals)
+- [Proposal](#proposal)
+  - [User Stories (Optional)](#user-stories-optional)
+    - [Story 1](#story-1)
+  - [Notes/Constraints/Caveats (Optional)](#notesconstraintscaveats-optional)
+  - [Risks and Mitigations](#risks-and-mitigations)
+- [Design Details](#design-details)
+  - [Resource Quota API](#resource-quota-api)
+  - [Workloads](#workloads)
+  - [Test Plan](#test-plan)
+      - [Prerequisite testing updates](#prerequisite-testing-updates)
+    - [Unit Tests](#unit-tests)
+    - [Integration tests](#integration-tests)
+    - [E2E Test](#e2e-test)
+  - [Graduation Criteria](#graduation-criteria)
+    - [Feature Gate](#feature-gate)
+- [Implementation History](#implementation-history)
+- [Drawbacks](#drawbacks)
+- [Alternatives](#alternatives)
+  - [Resource Claim By Count](#resource-claim-by-count)
+
+## Summary
+
+Dynamic Resource Allocation (DRA) is a major effort to improve device support in Kubernetes.
+It fundamentally changes how one can request devices and other resources.
+
+## Motivation
+
+Dynamic Resource Allocation (DRA) provides the groundwork for more sophisticated device allocation to Pods.
+Quota management is about enforcing rules around the use of resources.
+For example, GPUs are resource constrained, and a popular request is the ability to enforce fair sharing of GPU resources.
+Many users want access to these devices, and some want the ability to preempt other users when their workloads have a higher priority. Kueue provides support for this.
+
+DRA points toward a future where users can schedule partitionable GPU devices (MIG) or time-sliced GPUs. As devices gain more robust scheduling capabilities, it is important to walk through how Kueue will support DRA.
+
+### Background
+
+DRA has three APIs that are relevant for Kueue:
+
+- ResourceClaims
+- DeviceClasses
+- ResourceSlices
+
+#### DRA Example
+
+The easiest way to test DRA is with the [dra-example-driver repository](https://github.com/kubernetes-sigs/dra-example-driver).
+
+Clone that repo and run `make setup-e2e`; this creates a Kind cluster with the DRA feature gate enabled and installs a mock DRA driver.
+
+The driver does not use actual GPUs, which makes it a convenient test environment for exploring the Kueue and DRA integration.
+
+#### Workload Example
+
+An example workload that uses DRA:
+
+```yaml
+---
+apiVersion: resource.k8s.io/v1alpha3
+kind: ResourceClaimTemplate
+metadata:
+  namespace: gpu-test1
+  name: single-gpu
+spec:
+  spec:
+    devices:
+      requests:
+      - name: gpu
+        deviceClassName: gpu.example.com
+---
+apiVersion: batch/v1
+kind: Job
+metadata:
+  namespace: gpu-test1
+  name: job0
+  labels:
+    app: job
+    kueue.x-k8s.io/queue-name: user-queue
+spec:
+  template:
+    spec:
+      restartPolicy: Never
+      containers:
+      - name: ctr0
+        image: ubuntu:22.04
+        command: ["bash", "-c"]
+        args: ["export; sleep 9999"]
+        resources:
+          claims:
+          - name: gpu
+          requests:
+            cpu: 1
+            memory: "200Mi"
+      resourceClaims:
+      - name: gpu
+        resourceClaimTemplateName: single-gpu
+```
+
+#### Example Driver Cluster Resources
+
+The dra-example-driver creates a resource slice and a device class for the entire cluster.
+
+##### Resource slices
+
+Resource slices are meant for communication between drivers and the control plane. They are not expected to be used by workloads.
+
+Kueue does not need to be aware of these resources.
+
+##### Device classes
+
+Each driver creates a device class, and every resource claim references a device class.
+
+The dra-example-driver has a simple device class named `gpu.example.com`.
+
+Device classes provide a natural handle for enforcing quota limits.
+
+### Goals
+
+- Users can submit workloads using resource claims and Kueue can monitor the usage.
+- Admins can enforce a quota on the number of requests against a given device class.
+
+### Non-Goals
+
+- We are limiting the scope of DRA support to structured parameters (beta in Kubernetes 1.32).
+
+## Proposal
+
+### User Stories (Optional)
+
+#### Story 1
+
+As a user, I want to use resource claims to gain more control over the scheduling of devices.
+I have a DRA driver installed on my cluster and I am interested in using DRA for scheduling.
+
+I want to enforce quota usage for a ClusterQueue and forbid admitting workloads once they exceed the ClusterQueue limit.
+
+### Notes/Constraints/Caveats (Optional)
+
+### Risks and Mitigations
+
+## Design Details
+
+### Resource Quota API
+
+```golang
+type ResourceQuota struct {
+	// ...
+	// Kind distinguishes whether this resource is a core resource or a device class.
+	// +kubebuilder:validation:Enum={Core,DeviceClass}
+	// +kubebuilder:default=Core
+	Kind ResourceKind `json:"kind"`
+}
+```
+
+Kind allows one to distinguish between a core resource and a device class.
+
+With this, a cluster queue could be defined as follows:
+
+```yaml
+apiVersion: kueue.x-k8s.io/v1beta1
+kind: ClusterQueue
+metadata:
+  name: "cluster-queue"
+spec:
+  namespaceSelector: {} # match all.
+  resourceGroups:
+  - coveredResources: ["cpu", "memory", "gpu.example.com"]
+    flavors:
+    - name: "default-flavor"
+      resources:
+      - name: "cpu"
+        nominalQuota: 9
+      - name: "memory"
+        nominalQuota: "200Mi"
+      - name: "gpu.example.com"
+        nominalQuota: 2
+        kind: "DeviceClass"
+```
+
+### Workloads
+
+When a user submits a workload and the KueueDynamicResourceAllocation feature gate is enabled, Kueue will do the following:
+
+a. Read the claims from `resources.claims` in the PodTemplateSpec.
+b. Use the name of each claim to look up the corresponding `resourceClaimTemplateName` in the PodTemplateSpec's `resourceClaims`.
+c. Fetch the ResourceClaimTemplate with the name from (b), in the same namespace as the workload.
+d. Read the `deviceClassName` from the ResourceClaimTemplate.
+e. Tally every claim that requests the same `deviceClassName` and report it in the resource usage, as sketched below.
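+
+A minimal sketch of steps (a) through (e) for a single PodSpec (the helper name `deviceClassUsage` and its exact shape are illustrative assumptions, not the final implementation):
+
+```golang
+package sketch
+
+import (
+	"context"
+
+	corev1 "k8s.io/api/core/v1"
+	resourceapi "k8s.io/api/resource/v1alpha3"
+	k8sresource "k8s.io/apimachinery/pkg/api/resource"
+	"k8s.io/apimachinery/pkg/types"
+	"sigs.k8s.io/controller-runtime/pkg/client"
+)
+
+// deviceClassUsage tallies device-class requests for one PodSpec (illustrative only).
+func deviceClassUsage(ctx context.Context, cl client.Client, ps *corev1.PodSpec, namespace string) (corev1.ResourceList, error) {
+	usage := corev1.ResourceList{}
+	// (a) collect the claim names referenced by the containers.
+	referenced := map[string]bool{}
+	for i := range ps.Containers {
+		for _, c := range ps.Containers[i].Resources.Claims {
+			referenced[c.Name] = true
+		}
+	}
+	for _, prc := range ps.ResourceClaims {
+		// (b) match each referenced claim to its pod-level resourceClaims entry.
+		if !referenced[prc.Name] || prc.ResourceClaimTemplateName == nil {
+			continue
+		}
+		// (c) fetch the ResourceClaimTemplate from the workload's namespace.
+		tmpl := resourceapi.ResourceClaimTemplate{}
+		key := types.NamespacedName{Namespace: namespace, Name: *prc.ResourceClaimTemplateName}
+		if err := cl.Get(ctx, key, &tmpl); err != nil {
+			return nil, err
+		}
+		// (d) read the deviceClassName from each device request, and
+		// (e) tally one unit per request against that device class.
+		// (Real logic may also need to honor allocationMode/count.)
+		for _, req := range tmpl.Spec.Spec.Devices.Requests {
+			name := corev1.ResourceName(req.DeviceClassName)
+			quantity := usage[name]
+			quantity.Add(*k8sresource.NewQuantity(1, k8sresource.DecimalSI))
+			usage[name] = quantity
+		}
+	}
+	return usage, nil
+}
+```
+
+The annotated workload below shows where each of these names lives: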
+
+```yaml
+---
+apiVersion: batch/v1
+kind: Job
+metadata:
+  namespace: gpu-test1
+  name: job0
+  labels:
+    app: job
+    kueue.x-k8s.io/queue-name: user-queue
+spec:
+  template:
+    spec:
+      restartPolicy: Never
+      containers:
+      - name: ctr0
+        image: ubuntu:22.04
+        command: ["bash", "-c"]
+        args: ["export; sleep 9999"]
+        resources:
+          claims:
+          - name: gpu # a) read the claim from resources.claims
+          requests:
+            cpu: 1
+            memory: "200Mi"
+      resourceClaims:
+      - name: gpu # b) matches the name used in resources.claims
+        resourceClaimTemplateName: single-gpu # c) the name of the ResourceClaimTemplate
+---
+apiVersion: resource.k8s.io/v1alpha3
+kind: ResourceClaimTemplate
+metadata:
+  namespace: gpu-test1
+  name: single-gpu
+spec:
+  spec:
+    devices:
+      requests:
+      - name: gpu
+        deviceClassName: gpu.example.com # d) the name of the device class
+```
+
+### Test Plan
+
+[x] I/we understand the owners of the involved components may require updates to
+existing tests to make this code solid enough prior to committing the changes necessary
+to implement this enhancement.
+
+##### Prerequisite testing updates
+
+#### Unit Tests
+
+TBD
+- ``: `` - ``
+
+#### Integration tests
+
+It is not clear that DRA functionality (which requires alpha feature gates) can be exercised at the integration level.
+
+DRA requires a kubelet plugin, so this may not be a good candidate for an integration test.
+
+#### E2E Test
+
+It may be worth installing the dra-example-driver and testing this end to end.
+
+### Graduation Criteria
+
+#### Feature Gate
+
+We will introduce a KueueDynamicResourceAllocation feature gate.
+
+This feature gate will graduate to beta once DRA is beta.
+
+The goal is to limit behavioral changes to clusters where this feature gate is enabled in combination with the upstream DRA feature.
+
+## Implementation History
+
+- Draft on September 16th 2024.
+
+## Drawbacks
+
+Minimal. Kueue should be able to schedule devices following what upstream is proposing.
+The main drawback is that Kueue must fetch the referenced ResourceClaimTemplates for workloads that specify resource claims.
+
+## Alternatives
+
+### Resource Claim By Count
+
+Originally, the idea was to keep a tally of the resource claims for a given workload.
+The issue with this is that resource claims are namespace-scoped.
+To enforce quota usage across namespaces, we need to key quota on a cluster-scoped resource.
\ No newline at end of file diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/gpu-test1.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/gpu-test1.yaml new file mode 100644 index 0000000000..a2b072f70a --- /dev/null +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/gpu-test1.yaml @@ -0,0 +1,46 @@ +# Two pods, one container each +# Each container asking for 1 distinct GPU + +--- + +apiVersion: resource.k8s.io/v1alpha3 +kind: ResourceClaimTemplate +metadata: + namespace: gpu-test1 + name: single-gpu +spec: + spec: + devices: + requests: + - name: gpu + deviceClassName: gpu.example.com + +--- + +apiVersion: batch/v1 +kind: Job +metadata: + namespace: gpu-test1 + name: job0 + labels: + app: job + kueue.x-k8s.io/queue-name: user-queue +spec: + template: + spec: + restartPolicy: Never + containers: + - name: ctr0 + image: ubuntu:22.04 + command: ["bash", "-c"] + args: ["export; sleep 9999"] + resources: + claims: + - name: gpu + requests: + cpu: 1 + memory: "200Mi" + resourceClaims: + - name: gpu + resourceClaimTemplateName: gpu.example.com + diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml new file mode 100644 index 0000000000..8434ee8df1 --- /dev/null +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml @@ -0,0 +1,32 @@ +apiVersion: kueue.x-k8s.io/v1beta1 +kind: ResourceFlavor +metadata: + name: "default-flavor" +--- +apiVersion: kueue.x-k8s.io/v1beta1 +kind: ClusterQueue +metadata: + name: "cluster-queue" +spec: + namespaceSelector: {} # match all. + resourceGroups: + - coveredResources: ["cpu", "memory", "gpu.example.com"] + flavors: + - name: "default-flavor" + resources: + - name: "cpu" + nominalQuota: 9 + - name: "memory" + nominalQuota: "200Mi" + - name: "gpu.example.com" + nominalQuota: 2 + kind: "DeviceClass" +--- +apiVersion: kueue.x-k8s.io/v1beta1 +kind: LocalQueue +metadata: + namespace: "gpu-test1" + name: "user-queue" +spec: + clusterQueue: "cluster-queue" + diff --git a/keps/2941-DRA-Structured-Parameters/kep.yaml b/keps/2941-DRA-Structured-Parameters/kep.yaml new file mode 100644 index 0000000000..5013d83832 --- /dev/null +++ b/keps/2941-DRA-Structured-Parameters/kep.yaml @@ -0,0 +1,42 @@ +title: DRA (Structured Parameters) Support in Kueue +kep-number: 2941 +authors: + - "@kannon92" +status: provisional +creation-date: 2024-08-30 +reviewers: + - tbd + - "tbd" +approvers: + - TBD + - "tbd" + +see-also: + - "dra kep in upstream" + - "/keps/2345-everyone-gets-a-kep" +replaces: + - "/keps/3456-replaced-kep" + +# The target maturity stage in the current dev cycle for this KEP. +stage: alpha + +# The most recent milestone for which work toward delivery of this KEP has been +# done. This can be the current (upcoming) milestone, if it is being actively +# worked on. +latest-milestone: "v0.9" + +# The milestone at which this feature was, or is targeted to be, at each stage. 
+milestone: + alpha: "v0.9" + beta: "v0.10" + stable: "v0.11" + +# The following PRR answers are required at alpha release +# List the feature gate name and the components for which it must be enabled +feature-gates: + - name: MyFeature +disable-supported: true + +# The following PRR answers are required at beta release +metrics: + - my_feature_metric From 8a23e50ddbe1667ccd118bae5516a322fb1d0ac6 Mon Sep 17 00:00:00 2001 From: Kevin Hannon Date: Fri, 20 Sep 2024 13:23:43 -0400 Subject: [PATCH 2/4] poc for dynamic resource support in kueue --- config/components/rbac/role.yaml | 9 ++ .../examples/gpu-test1/gpu-test1.yaml | 6 +- .../gpu-test1/single-clusterqueue-setup.yaml | 1 - keps/2941-DRA-Structured-Parameters/kep.yaml | 2 +- .../core/clusterqueue_controller.go | 2 + pkg/controller/core/workload_controller.go | 4 + pkg/features/kube_features.go | 8 ++ pkg/queue/manager.go | 1 + pkg/util/limitrange/limitrange.go | 57 ++++++++++++ pkg/util/limitrange/limitrange_test.go | 43 +++++++++ pkg/util/testing/wrappers.go | 6 ++ pkg/workload/resources.go | 80 +++++++++++++++++ pkg/workload/resources_test.go | 87 +++++++++++++++++++ 13 files changed, 302 insertions(+), 4 deletions(-) diff --git a/config/components/rbac/role.yaml b/config/components/rbac/role.yaml index d708ec0799..328753c3d8 100644 --- a/config/components/rbac/role.yaml +++ b/config/components/rbac/role.yaml @@ -290,6 +290,15 @@ rules: verbs: - get - update +- apiGroups: + - resource.k8s.io + resources: + - deviceclasses + - resourceclaimtemplates + verbs: + - get + - list + - watch - apiGroups: - scheduling.k8s.io resources: diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/gpu-test1.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/gpu-test1.yaml index a2b072f70a..6e40ebe8c7 100644 --- a/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/gpu-test1.yaml +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/gpu-test1.yaml @@ -26,6 +26,8 @@ metadata: app: job kueue.x-k8s.io/queue-name: user-queue spec: + parallelism: 2 + completions: 2 template: spec: restartPolicy: Never @@ -39,8 +41,8 @@ spec: - name: gpu requests: cpu: 1 - memory: "200Mi" + memory: "100Mi" resourceClaims: - name: gpu - resourceClaimTemplateName: gpu.example.com + resourceClaimTemplateName: single-gpu diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml index 8434ee8df1..309e93d8d0 100644 --- a/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml @@ -20,7 +20,6 @@ spec: nominalQuota: "200Mi" - name: "gpu.example.com" nominalQuota: 2 - kind: "DeviceClass" --- apiVersion: kueue.x-k8s.io/v1beta1 kind: LocalQueue diff --git a/keps/2941-DRA-Structured-Parameters/kep.yaml b/keps/2941-DRA-Structured-Parameters/kep.yaml index 5013d83832..2a2b40d737 100644 --- a/keps/2941-DRA-Structured-Parameters/kep.yaml +++ b/keps/2941-DRA-Structured-Parameters/kep.yaml @@ -34,7 +34,7 @@ milestone: # The following PRR answers are required at alpha release # List the feature gate name and the components for which it must be enabled feature-gates: - - name: MyFeature + - name: KueueDynamicResourceAllocation disable-supported: true # The following PRR answers are required at beta release diff --git a/pkg/controller/core/clusterqueue_controller.go b/pkg/controller/core/clusterqueue_controller.go 
index 719f4caced..73179d2d7d 100644 --- a/pkg/controller/core/clusterqueue_controller.go +++ b/pkg/controller/core/clusterqueue_controller.go @@ -152,6 +152,8 @@ func NewClusterQueueReconciler( // +kubebuilder:rbac:groups="",resources=namespaces,verbs=get;list;watch // +kubebuilder:rbac:groups="",resources=events,verbs=create;watch;update;patch +// +kubebuilder:rbac:groups=resource.k8s.io,resources=resourceclaimtemplates,verbs=get;list;watch +// +kubebuilder:rbac:groups=resource.k8s.io,resources=deviceclasses,verbs=get;list;watch // +kubebuilder:rbac:groups=kueue.x-k8s.io,resources=clusterqueues,verbs=get;list;watch;create;update;patch;delete // +kubebuilder:rbac:groups=kueue.x-k8s.io,resources=clusterqueues/status,verbs=get;update;patch // +kubebuilder:rbac:groups=kueue.x-k8s.io,resources=clusterqueues/finalizers,verbs=update diff --git a/pkg/controller/core/workload_controller.go b/pkg/controller/core/workload_controller.go index 642312555d..23db631a62 100644 --- a/pkg/controller/core/workload_controller.go +++ b/pkg/controller/core/workload_controller.go @@ -569,6 +569,7 @@ func (r *WorkloadReconciler) Create(e event.CreateEvent) bool { ctx := ctrl.LoggerInto(context.Background(), log) wlCopy := wl.DeepCopy() workload.AdjustResources(ctx, r.client, wlCopy) + workload.AddDeviceClassesToContainerRequests(ctx, r.client, wlCopy) if !workload.HasQuotaReservation(wl) { if !r.queues.AddOrUpdateWorkload(wlCopy) { @@ -655,6 +656,7 @@ func (r *WorkloadReconciler) Update(e event.UpdateEvent) bool { wlCopy := wl.DeepCopy() // We do not handle old workload here as it will be deleted or replaced by new one anyway. workload.AdjustResources(ctrl.LoggerInto(ctx, log), r.client, wlCopy) + workload.AddDeviceClassesToContainerRequests(ctx, r.client, wlCopy) switch { case status == workload.StatusFinished || !active: @@ -858,6 +860,8 @@ func (h *resourceUpdatesHandler) queueReconcileForPending(ctx context.Context, _ log := log.WithValues("workload", klog.KObj(wlCopy)) log.V(5).Info("Queue reconcile for") workload.AdjustResources(ctrl.LoggerInto(ctx, log), h.r.client, wlCopy) + workload.AddDeviceClassesToContainerRequests(ctx, h.r.client, wlCopy) + if !h.r.queues.AddOrUpdateWorkload(wlCopy) { log.V(2).Info("Queue for workload didn't exist") } diff --git a/pkg/features/kube_features.go b/pkg/features/kube_features.go index 1fea5f250a..6c57ffd864 100644 --- a/pkg/features/kube_features.go +++ b/pkg/features/kube_features.go @@ -101,6 +101,13 @@ const ( // Enable more than one workload sharing flavors to preempt within a Cohort, // as long as the preemption targets don't overlap. 
	MultiplePreemptions featuregate.Feature = "MultiplePreemptions"
+
+	// owner: @kannon92
+	// kep: 2941
+	// This should follow the graduation process for structured parameters.
+	// alpha: v0.9
+	// Enable the usage of DRA for Kueue.
+	DynamicResourceStructuredParameters featuregate.Feature = "DynamicResourceStructuredParameters"
 )
 
 func init() {
@@ -124,6 +131,7 @@ var defaultFeatureGates = map[featuregate.Feature]featuregate.FeatureSpec{
 	LendingLimit:                    {Default: true, PreRelease: featuregate.Beta},
 	MultiKueueBatchJobWithManagedBy: {Default: false, PreRelease: featuregate.Alpha},
 	MultiplePreemptions:             {Default: true, PreRelease: featuregate.Beta},
+	DynamicResourceStructuredParameters: {Default: false, PreRelease: featuregate.Alpha},
 }
 
 func SetFeatureGateDuringTest(tb testing.TB, f featuregate.Feature, value bool) {
diff --git a/pkg/queue/manager.go b/pkg/queue/manager.go
index a36ee73f52..5a43b3efde 100644
--- a/pkg/queue/manager.go
+++ b/pkg/queue/manager.go
@@ -220,6 +220,7 @@ func (m *Manager) AddLocalQueue(ctx context.Context, q *kueue.LocalQueue) error
 			continue
 		}
 		workload.AdjustResources(ctx, m.client, &w)
+		workload.AddDeviceClassesToContainerRequests(ctx, m.client, &w)
 		qImpl.AddOrUpdate(workload.NewInfo(&w, m.workloadInfoOptions...))
 	}
 	cq := m.hm.ClusterQueues[qImpl.ClusterQueue]
diff --git a/pkg/util/limitrange/limitrange.go b/pkg/util/limitrange/limitrange.go
index 98fbde5faf..2ae360ad08 100644
--- a/pkg/util/limitrange/limitrange.go
+++ b/pkg/util/limitrange/limitrange.go
@@ -22,7 +22,9 @@ import (
 
 	corev1 "k8s.io/api/core/v1"
 	"k8s.io/utils/field"
+	"k8s.io/utils/ptr"
+	k8sresource "k8s.io/apimachinery/pkg/api/resource"
 	"sigs.k8s.io/kueue/pkg/util/resource"
 )
 
@@ -133,6 +135,61 @@ func calculateSidecarContainersResources(initContainers []corev1.Container) corev1.ResourceList {
 	return total
 }
 
+// TotalResourceClaimsFromPodSpec will calculate the number of requests
+// for ResourceClaimTemplates from a single pod spec.
+// We will increment all requests for PodResourceClaims.
+func TotalResourceClaimsFromPodSpec(ps *corev1.PodSpec) corev1.ResourceList {
+	return calculatePodClaims(ps)
+}
+
+func calculatePodClaims(ps *corev1.PodSpec) corev1.ResourceList {
+	totalClaims := make(map[string]int64)
+	totalResourceClaimTemplate := corev1.ResourceList{}
+	containers := ps.Containers
+	initContainers := ps.InitContainers
+	// We want to track the number of claims for the pod.
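+	// The tally happens in two passes. The loops below count how many times
+	// each claim name is referenced: once per regular container, once per
+	// init container, and once more for sidecar containers (restartPolicy
+	// Always), since those keep running alongside the main containers.
+	// The final loop then maps each per-claim count onto the ResourceClaim
+	// or ResourceClaimTemplate name declared under the pod's resourceClaims,
+	// so that usage is keyed by a name that quota can be enforced against.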
+ for i := range ps.Containers { + for _, val := range containers[i].Resources.Claims { + totalClaims[val.Name] = totalClaims[val.Name] + 1 + } + } + for i := range initContainers { + for _, val := range initContainers[i].Resources.Claims { + totalClaims[val.Name] = totalClaims[val.Name] + 1 + } + } + for i := range initContainers { + if isSidecarContainer(initContainers[i]) { + for _, val := range initContainers[i].Resources.Claims { + totalClaims[val.Name] = totalClaims[val.Name] + 1 + } + } + } + for _, val := range ps.ResourceClaims { + _, ok := totalClaims[val.Name] + if ok { + keyName := "" + if ptr.Deref(val.ResourceClaimName, "") != "" { + keyName = *val.ResourceClaimName + } else if ptr.Deref(val.ResourceClaimTemplateName, "") != "" { + keyName = *val.ResourceClaimTemplateName + } else { + // TODO: figure out what to do in this case + // DRA API says this is not allowed + return totalResourceClaimTemplate + } + countOfClaims, ok := totalResourceClaimTemplate[corev1.ResourceName(keyName)] + if ok { + count := countOfClaims.Value() + totalClaims[val.Name] + totalResourceClaimTemplate[corev1.ResourceName(keyName)] = *k8sresource.NewQuantity(count, k8sresource.DecimalSI) + } else { + totalResourceClaimTemplate[corev1.ResourceName(keyName)] = *k8sresource.NewQuantity(totalClaims[val.Name], k8sresource.DecimalSI) + } + } + } + return totalResourceClaimTemplate +} + func isSidecarContainer(container corev1.Container) bool { return container.RestartPolicy != nil && *container.RestartPolicy == corev1.ContainerRestartPolicyAlways } diff --git a/pkg/util/limitrange/limitrange_test.go b/pkg/util/limitrange/limitrange_test.go index 536f5b0f68..dfe2d703d9 100644 --- a/pkg/util/limitrange/limitrange_test.go +++ b/pkg/util/limitrange/limitrange_test.go @@ -23,6 +23,7 @@ import ( corev1 "k8s.io/api/core/v1" "k8s.io/apimachinery/pkg/api/resource" "k8s.io/utils/field" + "k8s.io/utils/ptr" testingutil "sigs.k8s.io/kueue/pkg/util/testing" ) @@ -501,3 +502,45 @@ func TestValidatePodSpec(t *testing.T) { }) } } + +func TestTotalResourceClaimsFromPodSpec(t *testing.T) { + cases := map[string]struct { + podSpec *corev1.PodSpec + want corev1.ResourceList + }{ + "pod without init containers. resource claims shared": { + podSpec: &corev1.PodSpec{ + Containers: []corev1.Container{ + *testingutil.MakeContainer(). + WithClaimReq([]corev1.ResourceClaim{{Name: "test"}}). + Obj(), + *testingutil.MakeContainer(). + WithClaimReq([]corev1.ResourceClaim{{Name: "test1"}}). 
+ Obj(), + }, + ResourceClaims: []corev1.PodResourceClaim{ + { + Name: "test", + ResourceClaimTemplateName: ptr.To("single-gpu"), + }, + { + Name: "test1", + ResourceClaimTemplateName: ptr.To("single-gpu"), + }, + }, + }, + want: corev1.ResourceList{ + "single-gpu": resource.MustParse("2"), + }, + }, + } + + for name, tc := range cases { + t.Run(name, func(t *testing.T) { + result := TotalResourceClaimsFromPodSpec(tc.podSpec) + if diff := cmp.Diff(tc.want, result); diff != "" { + t.Errorf("Unexpected result (-want,+got):\n%s", diff) + } + }) + } +} diff --git a/pkg/util/testing/wrappers.go b/pkg/util/testing/wrappers.go index f7c3555739..051622dca7 100644 --- a/pkg/util/testing/wrappers.go +++ b/pkg/util/testing/wrappers.go @@ -1203,6 +1203,12 @@ func (c *ContainerWrapper) WithResourceReq(resourceName corev1.ResourceName, qua return c } +// WithResourceClaim appends a claim request to the container +func (c *ContainerWrapper) WithClaimReq(claims []corev1.ResourceClaim) *ContainerWrapper { + c.Container.Resources.Claims = claims + return c +} + // AsSidecar makes the container a sidecar when used as an Init Container. func (c *ContainerWrapper) AsSidecar() *ContainerWrapper { c.Container.RestartPolicy = ptr.To(corev1.ContainerRestartPolicyAlways) diff --git a/pkg/workload/resources.go b/pkg/workload/resources.go index b8cf31c182..5854a5e4ce 100644 --- a/pkg/workload/resources.go +++ b/pkg/workload/resources.go @@ -22,12 +22,16 @@ import ( corev1 "k8s.io/api/core/v1" nodev1 "k8s.io/api/node/v1" + dra "k8s.io/api/resource/v1alpha3" + k8sresource "k8s.io/apimachinery/pkg/api/resource" "k8s.io/apimachinery/pkg/types" ctrl "sigs.k8s.io/controller-runtime" "sigs.k8s.io/controller-runtime/pkg/client" kueue "sigs.k8s.io/kueue/apis/kueue/v1beta1" "sigs.k8s.io/kueue/pkg/controller/core/indexer" + "sigs.k8s.io/kueue/pkg/features" + "sigs.k8s.io/kueue/pkg/resources" "sigs.k8s.io/kueue/pkg/util/limitrange" "sigs.k8s.io/kueue/pkg/util/resource" ) @@ -119,3 +123,79 @@ func AdjustResources(ctx context.Context, cl client.Client, wl *kueue.Workload) } handleLimitsToRequests(wl) } + +// GetResourceClaimTemplates will retrieve the ResourceClaimTemplate from the api server. +func GetResourceClaimTemplates(ctx context.Context, c client.Client, name, namespace string) (dra.ResourceClaimTemplate, error) { + resourceClaimTemplate := dra.ResourceClaimTemplate{} + err := c.Get(ctx, types.NamespacedName{Name: name, Namespace: namespace}, &resourceClaimTemplate, &client.GetOptions{}) + return resourceClaimTemplate, err +} + +func AddDeviceClassesToContainerRequests(ctx context.Context, cl client.Client, wl *kueue.Workload) { + // If DRA is not enabled then this becomes a no op and workloads won't be modified. 
+	// There is a potential issue: if Kueue has this feature enabled but the
+	// k8s cluster does not have the DRA feature enabled, then Kueue may not
+	// be able to find these resources.
+	if !features.Enabled(features.DynamicResourceStructuredParameters) {
+		return
+	}
+
+	log := ctrl.LoggerFrom(ctx)
+	resourceList, errors := handleResourceClaimTemplate(ctx, cl, AddResourceClaimsToResourceList(wl), wl.Namespace)
+	for key, val := range resourceList {
+		log.Info("ResourceList", "key", key, "val", val)
+	}
+	for _, err := range errors {
+		log.Error(err, "Failures adjusting requests for dynamic resources")
+	}
+	for pi := range wl.Spec.PodSets {
+		resourceClaimsToContainerRequests(&wl.Spec.PodSets[pi].Template.Spec, resourceList)
+	}
+}
+
+func resourceClaimsToContainerRequests(podSpec *corev1.PodSpec, resourceList corev1.ResourceList) {
+	for i := range podSpec.InitContainers {
+		res := &podSpec.InitContainers[i].Resources
+		res.Requests = resource.MergeResourceListKeepFirst(res.Requests, resourceList)
+	}
+	for i := range podSpec.Containers {
+		res := &podSpec.Containers[i].Resources
+		res.Requests = resource.MergeResourceListKeepFirst(res.Requests, resourceList)
+	}
+}
+
+func handleResourceClaimTemplate(ctx context.Context, cl client.Client, psr []PodSetResources, namespace string) (corev1.ResourceList, []error) {
+	var errors []error
+	updateResourceList := corev1.ResourceList{}
+	for _, singlePsr := range psr {
+		for key, request := range singlePsr.Requests {
+			draDeviceClass, err := GetResourceClaimTemplates(ctx, cl, key.String(), namespace)
+			if err != nil {
+				errors = append(errors, fmt.Errorf("unable to get %s/%s resource claim template: %v", namespace, key, err))
+			}
+			for _, val := range draDeviceClass.Spec.Spec.Devices.Requests {
+				updateResourceList[corev1.ResourceName(val.DeviceClassName)] = *k8sresource.NewQuantity(request, k8sresource.DecimalSI)
+			}
+		}
+	}
+	return updateResourceList, errors
+}
+
+func AddResourceClaimsToResourceList(wl *kueue.Workload) []PodSetResources {
+	if len(wl.Spec.PodSets) == 0 {
+		return nil
+	}
+	res := make([]PodSetResources, 0, len(wl.Spec.PodSets))
+	podSets := &wl.Spec.PodSets
+	currentCounts := podSetsCountsAfterReclaim(wl)
+	for _, ps := range *podSets {
+		count := currentCounts[ps.Name]
+		setRes := PodSetResources{
+			Name:  ps.Name,
+			Count: count,
+		}
+		setRes.Requests = resources.NewRequests(limitrange.TotalResourceClaimsFromPodSpec(&ps.Template.Spec))
+		scaleUp(setRes.Requests, int64(count))
+		res = append(res, setRes)
+	}
+	return res
+}
diff --git a/pkg/workload/resources_test.go b/pkg/workload/resources_test.go
index 0b5623401e..9a2bc5b2c5 100644
--- a/pkg/workload/resources_test.go
+++ b/pkg/workload/resources_test.go
@@ -19,6 +19,7 @@ import (
 	"github.com/google/go-cmp/cmp"
 	corev1 "k8s.io/api/core/v1"
 	nodev1 "k8s.io/api/node/v1"
+	dra "k8s.io/api/resource/v1alpha3"
 	"k8s.io/apimachinery/pkg/api/resource"
 
 	kueue "sigs.k8s.io/kueue/apis/kueue/v1beta1"
@@ -481,3 +482,89 @@ func TestAdjustResources(t *testing.T) {
 		})
 	}
 }
+
+func TestAddDeviceClassesToContainerRequests(t *testing.T) {
+	cases := map[string]struct {
+		wl                    *kueue.Workload
+		resourceClaimTemplate dra.ResourceClaimTemplate
+		wantWl                *kueue.Workload
+	}{
+		"single device class request": {
+			wl: utiltesting.MakeWorkload("foo", "").
+				PodSets(
+					*utiltesting.MakePodSet("a", 1).
+						InitContainers(corev1.Container{}).
+						Obj(),
+					*utiltesting.MakePodSet("b", 1).
+						InitContainers(corev1.Container{}).
+						Limit(corev1.ResourceCPU, "6").
+						Obj(),
+					*utiltesting.MakePodSet("c", 1).
+ InitContainers(corev1.Container{}). + Request(corev1.ResourceCPU, "1"). + Obj(), + ). + Obj(), + wantWl: utiltesting.MakeWorkload("foo", ""). + PodSets( + *utiltesting.MakePodSet("a", 1). + Limit(corev1.ResourceCPU, "4"). + Request(corev1.ResourceCPU, "3"). + InitContainers(corev1.Container{ + Resources: corev1.ResourceRequirements{ + Limits: corev1.ResourceList{ + corev1.ResourceCPU: *resource.NewQuantity(4, resource.DecimalSI), + }, + Requests: corev1.ResourceList{ + corev1.ResourceCPU: *resource.NewQuantity(3, resource.DecimalSI), + }, + }, + }). + Obj(), + *utiltesting.MakePodSet("b", 1). + Limit(corev1.ResourceCPU, "6"). + Request(corev1.ResourceCPU, "3"). + InitContainers(corev1.Container{ + Resources: corev1.ResourceRequirements{ + Limits: corev1.ResourceList{ + corev1.ResourceCPU: *resource.NewQuantity(4, resource.DecimalSI), + }, + Requests: corev1.ResourceList{ + corev1.ResourceCPU: *resource.NewQuantity(3, resource.DecimalSI), + }, + }, + }). + Obj(), + *utiltesting.MakePodSet("c", 1). + Limit(corev1.ResourceCPU, "4"). + Request(corev1.ResourceCPU, "1"). + InitContainers(corev1.Container{ + Resources: corev1.ResourceRequirements{ + Limits: corev1.ResourceList{ + corev1.ResourceCPU: *resource.NewQuantity(4, resource.DecimalSI), + }, + Requests: corev1.ResourceList{ + corev1.ResourceCPU: *resource.NewQuantity(3, resource.DecimalSI), + }, + }, + }). + Obj(), + ). + Obj(), + }, + } + for name, tc := range cases { + t.Run(name, func(t *testing.T) { + cl := utiltesting.NewClientBuilder().WithLists( + &nodev1.RuntimeClassList{Items: tc.runtimeClasses}, + &corev1.LimitRangeList{Items: tc.limitranges}, + ).WithIndex(&corev1.LimitRange{}, indexer.LimitRangeHasContainerType, indexer.IndexLimitRangeHasContainerType). + Build() + ctx, _ := utiltesting.ContextWithLog(t) + AddDeviceClassesToContainerRequests(ctx, cl, tc.wl) + if diff := cmp.Diff(tc.wl, tc.wantWl); diff != "" { + t.Errorf("Unexpected resources after adjusting (-want,+got): %s", diff) + } + }) + } +} From 88631bdac4a174a1c8b7913c70a973f037f4c868 Mon Sep 17 00:00:00 2001 From: Kevin Hannon Date: Fri, 20 Sep 2024 13:57:57 -0400 Subject: [PATCH 3/4] poc with some tests --- pkg/util/testing/wrappers.go | 16 ++++ pkg/workload/resources_test.go | 136 ++++++++++++++++++++++----------- 2 files changed, 106 insertions(+), 46 deletions(-) diff --git a/pkg/util/testing/wrappers.go b/pkg/util/testing/wrappers.go index 051622dca7..b82895cb75 100644 --- a/pkg/util/testing/wrappers.go +++ b/pkg/util/testing/wrappers.go @@ -401,6 +401,22 @@ func (p *PodSetWrapper) Limit(r corev1.ResourceName, q string) *PodSetWrapper { return p } +func (p *PodSetWrapper) Claim(claim corev1.ResourceClaim) *PodSetWrapper { + if p.Template.Spec.Containers[0].Resources.Claims == nil { + p.Template.Spec.Containers[0].Resources.Claims = []corev1.ResourceClaim{} + } + p.Template.Spec.Containers[0].Resources.Claims = append(p.Template.Spec.Containers[0].Resources.Claims, claim) + return p +} + +func (p *PodSetWrapper) ResourceClaim(resourceClaim corev1.PodResourceClaim) *PodSetWrapper { + if p.Template.Spec.ResourceClaims == nil { + p.Template.Spec.ResourceClaims = []corev1.PodResourceClaim{} + } + p.Template.Spec.ResourceClaims = append(p.Template.Spec.ResourceClaims, resourceClaim) + return p +} + func (p *PodSetWrapper) Image(image string) *PodSetWrapper { p.Template.Spec.Containers[0].Image = image return p diff --git a/pkg/workload/resources_test.go b/pkg/workload/resources_test.go index 9a2bc5b2c5..2b60af9607 100644 --- a/pkg/workload/resources_test.go +++ 
b/pkg/workload/resources_test.go @@ -21,9 +21,12 @@ import ( nodev1 "k8s.io/api/node/v1" dra "k8s.io/api/resource/v1alpha3" "k8s.io/apimachinery/pkg/api/resource" + v1 "k8s.io/apimachinery/pkg/apis/meta/v1" + "k8s.io/utils/ptr" kueue "sigs.k8s.io/kueue/apis/kueue/v1beta1" "sigs.k8s.io/kueue/pkg/controller/core/indexer" + "sigs.k8s.io/kueue/pkg/features" "sigs.k8s.io/kueue/pkg/resources" utiltesting "sigs.k8s.io/kueue/pkg/util/testing" ) @@ -486,67 +489,108 @@ func TestAdjustResources(t *testing.T) { func TestAddDeviceClassesToContainerRequests(t *testing.T) { cases := map[string]struct { wl *kueue.Workload - resourceClaimTemplate dra.ResourceClaimTemplate + enableDRAGate bool + resourceClaimTemplate []dra.ResourceClaimTemplate wantWl *kueue.Workload }{ - "single device class request": { + "dra feature gate off; ignore devices": { + enableDRAGate: false, + resourceClaimTemplate: []dra.ResourceClaimTemplate{ + { + ObjectMeta: v1.ObjectMeta{ + Name: "single-gpu", + Namespace: "", + }, + Spec: dra.ResourceClaimTemplateSpec{ + Spec: dra.ResourceClaimSpec{ + Devices: dra.DeviceClaim{ + Requests: []dra.DeviceRequest{{ + Name: "single-gpu", + DeviceClassName: "gpu.example.com", + }}, + }, + }, + }, + }, + }, wl: utiltesting.MakeWorkload("foo", ""). PodSets( *utiltesting.MakePodSet("a", 1). - InitContainers(corev1.Container{}). - Obj(), - *utiltesting.MakePodSet("b", 1). - InitContainers(corev1.Container{}). - Limit(corev1.ResourceCPU, "6"). - Obj(), - *utiltesting.MakePodSet("c", 1). - InitContainers(corev1.Container{}). + Limit(corev1.ResourceCPU, "2"). Request(corev1.ResourceCPU, "1"). + Claim(corev1.ResourceClaim{ + Name: "gpu", + }). + ResourceClaim(corev1.PodResourceClaim{ + Name: "gpu", + ResourceClaimTemplateName: ptr.To("single-gpu"), + }). Obj(), ). Obj(), wantWl: utiltesting.MakeWorkload("foo", ""). PodSets( *utiltesting.MakePodSet("a", 1). - Limit(corev1.ResourceCPU, "4"). - Request(corev1.ResourceCPU, "3"). - InitContainers(corev1.Container{ - Resources: corev1.ResourceRequirements{ - Limits: corev1.ResourceList{ - corev1.ResourceCPU: *resource.NewQuantity(4, resource.DecimalSI), - }, - Requests: corev1.ResourceList{ - corev1.ResourceCPU: *resource.NewQuantity(3, resource.DecimalSI), - }, - }, + Limit(corev1.ResourceCPU, "2"). + Request(corev1.ResourceCPU, "1"). + Claim(corev1.ResourceClaim{ + Name: "gpu", + }). + ResourceClaim(corev1.PodResourceClaim{ + Name: "gpu", + ResourceClaimTemplateName: ptr.To("single-gpu"), }). Obj(), - *utiltesting.MakePodSet("b", 1). - Limit(corev1.ResourceCPU, "6"). - Request(corev1.ResourceCPU, "3"). - InitContainers(corev1.Container{ - Resources: corev1.ResourceRequirements{ - Limits: corev1.ResourceList{ - corev1.ResourceCPU: *resource.NewQuantity(4, resource.DecimalSI), - }, - Requests: corev1.ResourceList{ - corev1.ResourceCPU: *resource.NewQuantity(3, resource.DecimalSI), - }, + ). + Obj(), + }, + "single device class request in a container": { + enableDRAGate: true, + resourceClaimTemplate: []dra.ResourceClaimTemplate{ + { + ObjectMeta: v1.ObjectMeta{ + Name: "single-gpu", + Namespace: "", + }, + Spec: dra.ResourceClaimTemplateSpec{ + Spec: dra.ResourceClaimSpec{ + Devices: dra.DeviceClaim{ + Requests: []dra.DeviceRequest{{ + Name: "single-gpu", + DeviceClassName: "gpu.example.com", + }}, }, + }, + }, + }, + }, + wl: utiltesting.MakeWorkload("foo", ""). + PodSets( + *utiltesting.MakePodSet("a", 1). + Limit(corev1.ResourceCPU, "2"). + Request(corev1.ResourceCPU, "1"). + Claim(corev1.ResourceClaim{ + Name: "gpu", + }). 
+ ResourceClaim(corev1.PodResourceClaim{ + Name: "gpu", + ResourceClaimTemplateName: ptr.To("single-gpu"), }). Obj(), - *utiltesting.MakePodSet("c", 1). - Limit(corev1.ResourceCPU, "4"). + ). + Obj(), + wantWl: utiltesting.MakeWorkload("foo", ""). + PodSets( + *utiltesting.MakePodSet("a", 1). + Limit(corev1.ResourceCPU, "2"). Request(corev1.ResourceCPU, "1"). - InitContainers(corev1.Container{ - Resources: corev1.ResourceRequirements{ - Limits: corev1.ResourceList{ - corev1.ResourceCPU: *resource.NewQuantity(4, resource.DecimalSI), - }, - Requests: corev1.ResourceList{ - corev1.ResourceCPU: *resource.NewQuantity(3, resource.DecimalSI), - }, - }, + Request("gpu.example.com", "1"). + Claim(corev1.ResourceClaim{ + Name: "gpu", + }). + ResourceClaim(corev1.PodResourceClaim{ + Name: "gpu", + ResourceClaimTemplateName: ptr.To("single-gpu"), }). Obj(), ). @@ -556,11 +600,11 @@ func TestAddDeviceClassesToContainerRequests(t *testing.T) { for name, tc := range cases { t.Run(name, func(t *testing.T) { cl := utiltesting.NewClientBuilder().WithLists( - &nodev1.RuntimeClassList{Items: tc.runtimeClasses}, - &corev1.LimitRangeList{Items: tc.limitranges}, - ).WithIndex(&corev1.LimitRange{}, indexer.LimitRangeHasContainerType, indexer.IndexLimitRangeHasContainerType). + &dra.ResourceClaimTemplateList{Items: tc.resourceClaimTemplate}, + ). Build() ctx, _ := utiltesting.ContextWithLog(t) + features.SetFeatureGateDuringTest(t, features.DynamicResourceStructuredParameters, tc.enableDRAGate) AddDeviceClassesToContainerRequests(ctx, cl, tc.wl) if diff := cmp.Diff(tc.wl, tc.wantWl); diff != "" { t.Errorf("Unexpected resources after adjusting (-want,+got): %s", diff) From 79900667d87ef8ed41e220750ef4b07ddf2d2f30 Mon Sep 17 00:00:00 2001 From: Kevin Hannon Date: Fri, 20 Sep 2024 16:42:53 -0400 Subject: [PATCH 4/4] get lint passing --- config/components/rbac/role.yaml | 1 - .../gpu-test1/single-clusterqueue-setup.yaml | 1 + .../examples/gpu-test2/gpu-test2.yaml | 42 ++++++++++++++ .../gpu-test2/single-clusterqueue-setup.yaml | 9 +++ .../examples/gpu-test3/gpu-test3.yaml | 56 +++++++++++++++++++ .../gpu-test3/single-clusterqueue-setup.yaml | 9 +++ .../core/clusterqueue_controller.go | 1 - pkg/util/limitrange/limitrange.go | 16 +++--- pkg/workload/resources_test.go | 6 +- test/e2e/config/common/manager_e2e_patch.yaml | 2 +- 10 files changed, 129 insertions(+), 14 deletions(-) create mode 100644 keps/2941-DRA-Structured-Parameters/examples/gpu-test2/gpu-test2.yaml create mode 100644 keps/2941-DRA-Structured-Parameters/examples/gpu-test2/single-clusterqueue-setup.yaml create mode 100644 keps/2941-DRA-Structured-Parameters/examples/gpu-test3/gpu-test3.yaml create mode 100644 keps/2941-DRA-Structured-Parameters/examples/gpu-test3/single-clusterqueue-setup.yaml diff --git a/config/components/rbac/role.yaml b/config/components/rbac/role.yaml index 328753c3d8..7b94ff9d9e 100644 --- a/config/components/rbac/role.yaml +++ b/config/components/rbac/role.yaml @@ -293,7 +293,6 @@ rules: - apiGroups: - resource.k8s.io resources: - - deviceclasses - resourceclaimtemplates verbs: - get diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml index 309e93d8d0..7ea9df25a4 100644 --- a/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test1/single-clusterqueue-setup.yaml @@ -1,3 +1,4 @@ + apiVersion: 
kueue.x-k8s.io/v1beta1 kind: ResourceFlavor metadata: diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test2/gpu-test2.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test2/gpu-test2.yaml new file mode 100644 index 0000000000..35f334a326 --- /dev/null +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test2/gpu-test2.yaml @@ -0,0 +1,42 @@ +# One pod, one container +# Asking for 2 distinct GPUs + +--- +apiVersion: resource.k8s.io/v1alpha3 +kind: ResourceClaimTemplate +metadata: + namespace: gpu-test2 + name: multiple-gpus +spec: + spec: + devices: + requests: + - name: gpus + deviceClassName: gpu.example.com + allocationMode: ExactCount + count: 2 + +--- +apiVersion: batch/v1 +kind: Job +metadata: + namespace: gpu-test2 + name: job0 + labels: + app: job + kueue.x-k8s.io/queue-name: user-queue-gpu-test2 +spec: + template: + spec: + restartPolicy: Never + containers: + - name: ctr0 + image: ubuntu:22.04 + command: ["bash", "-c"] + args: ["export; sleep 9999"] + resources: + claims: + - name: gpus + resourceClaims: + - name: gpus + resourceClaimTemplateName: multiple-gpus diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test2/single-clusterqueue-setup.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test2/single-clusterqueue-setup.yaml new file mode 100644 index 0000000000..e6f3f59ef5 --- /dev/null +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test2/single-clusterqueue-setup.yaml @@ -0,0 +1,9 @@ + +apiVersion: kueue.x-k8s.io/v1beta1 +kind: LocalQueue +metadata: + namespace: "gpu-test2" + name: "user-queue-gpu-test2" +spec: + clusterQueue: "cluster-queue" + diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test3/gpu-test3.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test3/gpu-test3.yaml new file mode 100644 index 0000000000..4a47a71657 --- /dev/null +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test3/gpu-test3.yaml @@ -0,0 +1,56 @@ +# One pod, two containers +# Each asking for shared access to a single GPU + +--- +apiVersion: v1 +kind: Namespace +metadata: + name: gpu-test3 + +--- +apiVersion: resource.k8s.io/v1alpha3 +kind: ResourceClaimTemplate +metadata: + namespace: gpu-test3 + name: single-gpu +spec: + spec: + devices: + requests: + - name: gpu + deviceClassName: gpu.example.com + +--- + +apiVersion: batch/v1 +kind: Job +metadata: + namespace: gpu-test3 + name: job0 + labels: + app: job + kueue.x-k8s.io/queue-name: "user-queue-gpu-test3" +spec: + parallelism: 1 + completions: 1 + template: + spec: + restartPolicy: Never + containers: + - name: ctr0 + image: ubuntu:22.04 + command: ["bash", "-c"] + args: ["export; sleep 9999"] + resources: + claims: + - name: shared-gpu + - name: ctr1 + image: ubuntu:22.04 + command: ["bash", "-c"] + args: ["export; sleep 9999"] + resources: + claims: + - name: shared-gpu + resourceClaims: + - name: shared-gpu + resourceClaimTemplateName: single-gpu diff --git a/keps/2941-DRA-Structured-Parameters/examples/gpu-test3/single-clusterqueue-setup.yaml b/keps/2941-DRA-Structured-Parameters/examples/gpu-test3/single-clusterqueue-setup.yaml new file mode 100644 index 0000000000..1c26666caf --- /dev/null +++ b/keps/2941-DRA-Structured-Parameters/examples/gpu-test3/single-clusterqueue-setup.yaml @@ -0,0 +1,9 @@ + +apiVersion: kueue.x-k8s.io/v1beta1 +kind: LocalQueue +metadata: + namespace: "gpu-test3" + name: "user-queue-gpu-test3" +spec: + clusterQueue: "cluster-queue" + diff --git a/pkg/controller/core/clusterqueue_controller.go b/pkg/controller/core/clusterqueue_controller.go 
index 73179d2d7d..785cca556f 100644 --- a/pkg/controller/core/clusterqueue_controller.go +++ b/pkg/controller/core/clusterqueue_controller.go @@ -153,7 +153,6 @@ func NewClusterQueueReconciler( // +kubebuilder:rbac:groups="",resources=namespaces,verbs=get;list;watch // +kubebuilder:rbac:groups="",resources=events,verbs=create;watch;update;patch // +kubebuilder:rbac:groups=resource.k8s.io,resources=resourceclaimtemplates,verbs=get;list;watch -// +kubebuilder:rbac:groups=resource.k8s.io,resources=deviceclasses,verbs=get;list;watch // +kubebuilder:rbac:groups=kueue.x-k8s.io,resources=clusterqueues,verbs=get;list;watch;create;update;patch;delete // +kubebuilder:rbac:groups=kueue.x-k8s.io,resources=clusterqueues/status,verbs=get;update;patch // +kubebuilder:rbac:groups=kueue.x-k8s.io,resources=clusterqueues/finalizers,verbs=update diff --git a/pkg/util/limitrange/limitrange.go b/pkg/util/limitrange/limitrange.go index 2ae360ad08..3bd3bd7b82 100644 --- a/pkg/util/limitrange/limitrange.go +++ b/pkg/util/limitrange/limitrange.go @@ -25,6 +25,7 @@ import ( "k8s.io/utils/ptr" k8sresource "k8s.io/apimachinery/pkg/api/resource" + "sigs.k8s.io/kueue/pkg/util/resource" ) @@ -150,18 +151,18 @@ func calculatePodClaims(ps *corev1.PodSpec) corev1.ResourceList { // We want to track the number of claims for the pod. for i := range ps.Containers { for _, val := range containers[i].Resources.Claims { - totalClaims[val.Name] = totalClaims[val.Name] + 1 + totalClaims[val.Name]++ } } for i := range initContainers { for _, val := range initContainers[i].Resources.Claims { - totalClaims[val.Name] = totalClaims[val.Name] + 1 + totalClaims[val.Name]++ } } for i := range initContainers { if isSidecarContainer(initContainers[i]) { for _, val := range initContainers[i].Resources.Claims { - totalClaims[val.Name] = totalClaims[val.Name] + 1 + totalClaims[val.Name]++ } } } @@ -169,13 +170,12 @@ func calculatePodClaims(ps *corev1.PodSpec) corev1.ResourceList { _, ok := totalClaims[val.Name] if ok { keyName := "" - if ptr.Deref(val.ResourceClaimName, "") != "" { + switch { + case ptr.Deref(val.ResourceClaimName, "") != "": keyName = *val.ResourceClaimName - } else if ptr.Deref(val.ResourceClaimTemplateName, "") != "" { + case ptr.Deref(val.ResourceClaimTemplateName, "") != "": keyName = *val.ResourceClaimTemplateName - } else { - // TODO: figure out what to do in this case - // DRA API says this is not allowed + default: return totalResourceClaimTemplate } countOfClaims, ok := totalResourceClaimTemplate[corev1.ResourceName(keyName)] diff --git a/pkg/workload/resources_test.go b/pkg/workload/resources_test.go index 2b60af9607..fc22ea21dd 100644 --- a/pkg/workload/resources_test.go +++ b/pkg/workload/resources_test.go @@ -21,7 +21,7 @@ import ( nodev1 "k8s.io/api/node/v1" dra "k8s.io/api/resource/v1alpha3" "k8s.io/apimachinery/pkg/api/resource" - v1 "k8s.io/apimachinery/pkg/apis/meta/v1" + metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/utils/ptr" kueue "sigs.k8s.io/kueue/apis/kueue/v1beta1" @@ -497,7 +497,7 @@ func TestAddDeviceClassesToContainerRequests(t *testing.T) { enableDRAGate: false, resourceClaimTemplate: []dra.ResourceClaimTemplate{ { - ObjectMeta: v1.ObjectMeta{ + ObjectMeta: metav1.ObjectMeta{ Name: "single-gpu", Namespace: "", }, @@ -548,7 +548,7 @@ func TestAddDeviceClassesToContainerRequests(t *testing.T) { enableDRAGate: true, resourceClaimTemplate: []dra.ResourceClaimTemplate{ { - ObjectMeta: v1.ObjectMeta{ + ObjectMeta: metav1.ObjectMeta{ Name: "single-gpu", Namespace: "", }, diff --git 
a/test/e2e/config/common/manager_e2e_patch.yaml b/test/e2e/config/common/manager_e2e_patch.yaml index 2a5c3b0486..fbb0ffbe0b 100644 --- a/test/e2e/config/common/manager_e2e_patch.yaml +++ b/test/e2e/config/common/manager_e2e_patch.yaml @@ -3,4 +3,4 @@ value: IfNotPresent - op: add path: /spec/template/spec/containers/0/args/- - value: --feature-gates=MultiKueue=true,MultiKueueBatchJobWithManagedBy=true + value: --feature-gates=VisibilityOnDemand=true,MultiKueue=true,MultiKueueBatchJobWithManagedBy=true,DynamicResourceStructuredParameters=true