18 changes: 18 additions & 0 deletions Makefile
@@ -233,6 +233,24 @@ $(BIN_PATH)/%: .static.%.$(STATIC)

.PRECIOUS: $(foreach dir,$(BUILD_DIRS),.static.$(dir).1 .static.$(dir).)

#
# Eskimo words for snow...
#

balloons: $(BIN_PATH)/nri-resource-policy-balloons
balloons-img: image.nri-resource-policy-balloons
t-a topology-aware: $(BIN_PATH)/nri-resource-policy-topology-aware
ta-img topology-aware-img: image.nri-resource-policy-topology-aware
template: $(BIN_PATH)/nri-resource-policy-template
template-img: image.nri-resource-policy-template
memqos memory-qos: $(BIN_PATH)/nri-memory-qos
memqos-img memory-qos-img: image.nri-memory-qos
memtierd: $(BIN_PATH)/nri-memtierd
memtierd-img: image.nri-memtierd
sgx-epc sgx: $(BIN_PATH)/nri-sgx-epc
sgx-epc-img: image.nri-sgx-epc
config-manager: $(BIN_PATH)/config-manager

#
# Image building test deployment generation targets
#
226 changes: 226 additions & 0 deletions README-DRA-driver-proto.md
@@ -0,0 +1,226 @@
# Prototyping CPU DRA device abstraction / DRA-based CPU allocation

## Background

This prototype patch set bolts a DRA allocation frontend on top of the existing
topology-aware resource policy plugin. The main intention of this patch set
is to

- provide something practical to play around with for the [feasibility study](https://docs.google.com/document/d/1Tb_dC60YVCBr7cNYWuVLddUUTMcNoIt3zjd5-8rgug0/edit?tab=t.0#heading=h.iutbebngx80e) of enabling DRA-based CPU allocation,
- allow (relatively) easy experimentation with how to expose CPUs as DRA
  devices (IOW, test various CPU DRA attributes), and
- allow testing how DRA-based CPU allocation (using non-trivial CEL expressions)
  would scale with cluster and cluster node size.

## Notes

This patched NRI plugin, especially in its current state and form, is
*not a proposal* for a first real DRA-based CPU driver.

## Prerequisites for Testing

To test this out in a cluster, make sure you have

1. A recent enough control plane with DRA v1 support (for instance Kubernetes v1.35.0).

2. CDI enabled in your runtime configuration

## Installation and Testing

Once you have your cluster properly set up, you can pull this into your
cluster for testing with something like this:

```bash
helm install --devel -n kube-system test oci://ghcr.io/klihub/nri-plugins/helm-charts/nri-resource-policy-topology-aware --version v0.12-dra-driver-unstable --set image.pullPolicy=Always --set extraEnv.OVERRIDE_SYS_ATOM_CPUS='2-5' --set extraEnv.OVERRIDE_SYS_CORE_CPUS='0\,1\,6-15'
```
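The `--set extraEnv.OVERRIDE_SYS_*` flags above override the detected system
topology for testing, and the commas in the CPU lists need shell escaping. As
a sketch (assuming the chart consumes `image` and `extraEnv` exactly as the
`--set` flags above suggest), the same settings can live in a values file
where no escaping is needed:

```yaml
# values.yaml -- hypothetical equivalent of the --set flags above
image:
  pullPolicy: Always
extraEnv:
  OVERRIDE_SYS_ATOM_CPUS: "2-5"
  OVERRIDE_SYS_CORE_CPUS: "0,1,6-15"
```

It would then be passed to the same command with `-f values.yaml` instead of
the `--set` options.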

Once the NRI plugin + DRA driver is up and running, you should see some CPUs
exposed as DRA devices. You can check the resource slices with the following
command:

```bash
[kli@n4c16-fedora-40-cloud-base-containerd ~]# kubectl get resourceslices
NAME                                                     NODE                                    DRIVER       POOL    AGE
n4c16-fedora-40-cloud-base-containerd-native.cpu-jxfkj   n4c16-fedora-40-cloud-base-containerd   native.cpu   pool0   4d2h
```

And you can examine the exposed devices like this:

```bash
[kli@n4c16-fedora-40-cloud-base-containerd ~]# kubectl get resourceslices -oyaml | less
apiVersion: v1
items:
- apiVersion: resource.k8s.io/v1
  kind: ResourceSlice
  metadata:
    creationTimestamp: "2025-06-10T06:01:54Z"
    generateName: n4c16-fedora-40-cloud-base-containerd-native.cpu-
    generation: 1
    name: n4c16-fedora-40-cloud-base-containerd-native.cpu-jxfkj
    ownerReferences:
    - apiVersion: v1
      controller: true
      kind: Node
      name: n4c16-fedora-40-cloud-base-containerd
      uid: 90a99f1f-c1ca-4bea-8dbd-3cc821f744b1
    resourceVersion: "871388"
    uid: 4639d31f-e508-4b0a-8378-867f6c1c7cb1
  spec:
    devices:
    - attributes:
        cache0ID:
          int: 0
        cache1ID:
          int: 8
        cache2ID:
          int: 16
        cache3ID:
          int: 24
        cluster:
          int: 0
        core:
          int: 0
        coreType:
          string: P-core
        die:
          int: 0
        isolated:
          bool: false
        localMemory:
          int: 0
        package:
          int: 0
      name: cpu1
    - attributes:
        cache0ID:
          int: 1
        cache1ID:
          int: 9
        cache2ID:
          int: 17
        cache3ID:
          int: 24
        cluster:
          int: 2
        core:
          int: 1
        coreType:
          string: E-core
        die:
          int: 0
        isolated:
          bool: false
        localMemory:
          int: 0
        package:
          int: 0
      name: cpu2
    - attributes:
        cache0ID:
          int: 1
        cache1ID:
          int: 9
        cache2ID:
          int: 17
        cache3ID:
          int: 24
        cluster:
          int: 2
        core:
          ...
```

If everything looks fine and you do have CPUs available as DRA devices, you
can test DRA-based CPU allocation with something like this. This allocates
a single P-core to the container.

```yaml
apiVersion: resource.k8s.io/v1
kind: ResourceClaimTemplate
metadata:
  name: any-cores
spec:
  spec:
    devices:
      requests:
      - name: cpu
        exactly:
          deviceClassName: native.cpu
---
apiVersion: resource.k8s.io/v1
kind: ResourceClaimTemplate
metadata:
  name: p-cores
spec:
  spec:
    devices:
      requests:
      - name: cpu
        exactly:
          deviceClassName: native.cpu
          selectors:
          - cel:
              expression: device.attributes["native.cpu"].coreType == "P-core"
          count: 1
---
apiVersion: resource.k8s.io/v1
kind: ResourceClaimTemplate
metadata:
  name: e-cores
spec:
  spec:
    devices:
      requests:
      - name: cpu
        exactly:
          deviceClassName: native.cpu
          selectors:
          - cel:
              expression: device.attributes["native.cpu"].coreType == "E-core"
          count: 1
---
apiVersion: v1
kind: Pod
metadata:
  name: pcore-test
  labels:
    app: pod
spec:
  containers:
  - name: ctr0
    image: busybox
    imagePullPolicy: IfNotPresent
    args:
    - /bin/sh
    - -c
    - trap 'exit 0' TERM; sleep 3600 & wait
    resources:
      requests:
        cpu: 1
        memory: 100M
      limits:
        cpu: 1
        memory: 100M
      claims:
      - name: claim-pcores
  resourceClaims:
  - name: claim-pcores
    resourceClaimTemplateName: p-cores
  terminationGracePeriodSeconds: 1
```
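CEL selectors can combine any of the attributes shown in the resource slice
output above. As a sketch (the `e-core-pair` template name is made up, and
`cluster == 2` is taken from the example output above), this hypothetical
claim template asks for two non-isolated E-cores from one specific cluster:

```yaml
apiVersion: resource.k8s.io/v1
kind: ResourceClaimTemplate
metadata:
  name: e-core-pair
spec:
  spec:
    devices:
      requests:
      - name: cpu
        exactly:
          deviceClassName: native.cpu
          selectors:
          - cel:
              expression: >-
                device.attributes["native.cpu"].coreType == "E-core" &&
                device.attributes["native.cpu"].cluster == 2 &&
                !device.attributes["native.cpu"].isolated
          count: 2
```

Non-trivial expressions like this are also what the scalability testing
mentioned above is about.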

If you want to try a mixed native CPU + DRA-based allocation, try
increasing the CPU request and limit in the pod's spec to 1500m CPUs
and see what happens.
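As a sketch, the container's resources section in the pod above would then
look like this, with the P-core claim kept as before:

```yaml
resources:
  requests:
    cpu: 1500m
    memory: 100M
  limits:
    cpu: 1500m
    memory: 100M
  claims:
  - name: claim-pcores
```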


## Playing Around with CPU Abstractions

If you want to play around with this (for instance, modify the exposed CPU abstraction), the easiest way is to

1. [fork](https://github.com/containers/nri-plugins/fork) the [main NRI Reference Plugins](https://github.com/containers/nri-plugins) repo,
2. enable GitHub Actions in your personal fork,
3. make any changes you want (for instance, to alter the CPU abstraction, take a look at [cpu.DRA()](https://github.com/klihub/nri-plugins/blob/test/build/dra-driver/pkg/sysfs/dra.go)),
4. push your changes to ssh://git@github.com/$YOUR_FORK/nri-plugins/refs/heads/test/build/dra-driver,
5. wait for the image and Helm chart publishing actions to succeed, and
6. once done, pull the result into your cluster with something like `helm install --devel -n kube-system test oci://ghcr.io/$YOUR_GITHUB_USERID/nri-plugins/helm-charts/nri-resource-policy-topology-aware --version v0.9-dra-driver-unstable`.
3 changes: 3 additions & 0 deletions README.md
@@ -19,3 +19,6 @@ Currently following plugins are available:
[5]: https://containers.github.io/nri-plugins/stable/docs/memory/sgx-epc.html

See the [NRI plugins documentation](https://containers.github.io/nri-plugins/) for more information.

See the [DRA CPU driver prototype notes](README-DRA-driver-proto.md) for more information
about using the Topology Aware policy as a DRA CPU driver.
12 changes: 12 additions & 0 deletions cmd/plugins/balloons/policy/balloons-policy.go
@@ -372,6 +372,18 @@ func (p *balloons) UpdateResources(c cache.Container) error {
return nil
}

// AllocateClaim allocates CPUs for the claim.
func (p *balloons) AllocateClaim(claim policy.Claim) error {
log.Debug("allocating claim %s for pods %v...", claim.String(), claim.GetPods())
return nil
}

// ReleaseClaim releases CPUs of the claim.
func (p *balloons) ReleaseClaim(claim policy.Claim) error {
log.Debug("releasing claim %s for pods %v...", claim.String(), claim.GetPods())
return nil
}

// HandleEvent handles policy-specific events.
func (p *balloons) HandleEvent(*events.Policy) (bool, error) {
log.Debug("(not) handling event...")
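The new `AllocateClaim`/`ReleaseClaim` stub hooks above only rely on two
methods of the claim, `String()` and `GetPods()`. A minimal self-contained
sketch of that shape (the `Claim` interface here is reduced to just those
two methods, and `mockClaim` is hypothetical, not part of the repo):

```go
package main

import "fmt"

// Claim mirrors the two methods the AllocateClaim/ReleaseClaim stubs
// actually use; the real policy.Claim interface may carry more.
type Claim interface {
	String() string
	GetPods() []string
}

// mockClaim is a hypothetical stand-in for a DRA resource claim.
type mockClaim struct {
	uid  string
	pods []string
}

func (c *mockClaim) String() string    { return c.uid }
func (c *mockClaim) GetPods() []string { return c.pods }

// allocateClaim mimics the no-op stub: log the claim and accept it.
func allocateClaim(claim Claim) error {
	fmt.Printf("allocating claim %s for pods %v...\n", claim.String(), claim.GetPods())
	return nil
}

func main() {
	c := &mockClaim{uid: "claim-0", pods: []string{"pod-0", "pod-1"}}
	if err := allocateClaim(c); err != nil {
		panic(err)
	}
}
```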
12 changes: 12 additions & 0 deletions cmd/plugins/template/policy/template-policy.go
@@ -108,6 +108,18 @@ func (p *policy) UpdateResources(c cache.Container) error {
return nil
}

// AllocateClaim allocates CPUs for the claim.
func (p *policy) AllocateClaim(claim policyapi.Claim) error {
log.Debug("allocating claim %s for pods %v...", claim.String(), claim.GetPods())
return nil
}

// ReleaseClaim releases CPUs of the claim.
func (p *policy) ReleaseClaim(claim policyapi.Claim) error {
log.Debug("releasing claim %s for pods %v...", claim.String(), claim.GetPods())
return nil
}

// HandleEvent handles policy-specific events.
func (p *policy) HandleEvent(e *events.Policy) (bool, error) {
log.Info("received policy event %s.%s with data %v...", e.Source, e.Type, e.Data)
3 changes: 3 additions & 0 deletions cmd/plugins/topology-aware/policy/cache.go
@@ -126,6 +126,7 @@ func (p *policy) reinstateGrants(grants map[string]Grant) error {

type cachedGrant struct {
PrettyName string
Claimed string
Exclusive string
Part int
CPUType cpuClass
@@ -140,6 +141,7 @@ type cachedGrant struct {
func newCachedGrant(cg Grant) *cachedGrant {
ccg := &cachedGrant{}
ccg.PrettyName = cg.GetContainer().PrettyName()
ccg.Claimed = cg.ClaimedCPUs().String()
ccg.Exclusive = cg.ExclusiveCPUs().String()
ccg.Part = cg.CPUPortion()
ccg.CPUType = cg.CPUType()
@@ -168,6 +170,7 @@ func (ccg *cachedGrant) ToGrant(policy *policy) (Grant, error) {
container,
ccg.CPUType,
cpuset.MustParse(ccg.Exclusive),
cpuset.MustParse(ccg.Claimed),
ccg.Part,
ccg.MemType,
ccg.ColdStart,
17 changes: 17 additions & 0 deletions cmd/plugins/topology-aware/policy/mocks_test.go
@@ -30,6 +30,7 @@ import (
"github.com/intel/goresctrl/pkg/sst"
idset "github.com/intel/goresctrl/pkg/utils"
v1 "k8s.io/api/core/v1"
resapi "k8s.io/api/resource/v1"
)

type mockSystemNode struct {
@@ -207,6 +208,10 @@ func (c *mockCPU) CoreKind() sysfs.CoreKind {
return sysfs.PerformanceCore
}

func (c *mockCPU) DRA(extras ...map[sysfs.QualifiedName]sysfs.Attribute) *resapi.Device {
panic("unimplemented")
}

type mockSystem struct {
isolatedCPU int
nodes []sysfs.Node
@@ -348,6 +353,9 @@ func (fake *mockSystem) NodeDistance(idset.ID, idset.ID) int {
func (fake *mockSystem) NodeHintToCPUs(string) string {
return ""
}
func (fake *mockSystem) CPUsAsDRADevices(ids []idset.ID) []resapi.Device {
panic("unimplemented")
}

type mockContainer struct {
name string
@@ -408,6 +416,9 @@ func (m *mockContainer) GetAnnotation(string, interface{}) (string, bool) {
func (m *mockContainer) GetEnv(string) (string, bool) {
panic("unimplemented")
}
func (m *mockContainer) GetEnvList() []string {
panic("unimplemented")
}
func (m *mockContainer) GetAnnotations() map[string]string {
panic("unimplemented")
}
@@ -752,6 +763,12 @@ func (m *mockCache) SetPolicyEntry(string, interface{}) {
func (m *mockCache) GetPolicyEntry(string, interface{}) bool {
return m.returnValueForGetPolicyEntry
}
func (m *mockCache) SetEntry(string, interface{}) {
panic("unimplemented")
}
func (m *mockCache) GetEntry(string, interface{}) (interface{}, error) {
panic("unimplemented")
}
func (m *mockCache) Save() error {
return nil
}