diff --git a/content/en/docs/reference/command-line-tools-reference/feature-gates/KubeletPodResourcesDynamicResources.md b/content/en/docs/reference/command-line-tools-reference/feature-gates/KubeletPodResourcesDynamicResources.md index 4173e41d092c3..ec9110518d99d 100644 --- a/content/en/docs/reference/command-line-tools-reference/feature-gates/KubeletPodResourcesDynamicResources.md +++ b/content/en/docs/reference/command-line-tools-reference/feature-gates/KubeletPodResourcesDynamicResources.md @@ -18,3 +18,22 @@ Extend the kubelet's [pod resources monitoring gRPC API](/docs/concepts/extend-kubernetes/compute-storage-net/device-plugins.md) endpoints List and Get to include resources allocated in ResourceClaims via [Dynamic Resource Allocation](/docs/concepts/scheduling-eviction/dynamic-resource-allocation/). + +The following example shows GPU metrics that [NVIDIA dcgm-exporter](https://github.com/NVIDIA/dcgm-exporter) collects through this API, reported per Pod for GPUs allocated by the [NVIDIA DRA driver](https://github.com/NVIDIA/k8s-dra-driver-gpu): + +``` +DCGM_FI_PROF_PCIE_RX_BYTES{gpu="0",UUID="GPU-a4f34abc-7715-3560-dcea-7238b9611a45",pci_bus_id="00000009:01:00.0",device="nvidia0",modelName="NVIDIA GH200 96GB HBM3",Hostname="sc-starwars-xxxx",container="ctr",dra_claim_name="single-gpu",dra_claim_namespace="gpu-test3",dra_device_name="gpu-0",dra_driver_name="gpu.nvidia.com",dra_pool_name="sc-starwars-xxxx",namespace="gpu-test3",pod="pod1"} 23792 + +DCGM_FI_PROF_PCIE_RX_BYTES{gpu="0",UUID="GPU-a4f34abc-7715-3560-dcea-7238b9611a45",pci_bus_id="00000009:01:00.0",device="nvidia0",modelName="NVIDIA GH200 96GB HBM3",Hostname="sc-starwars-xxxx",container="ctr",dra_claim_name="single-gpu",dra_claim_namespace="gpu-test3",dra_device_name="gpu-0",dra_driver_name="gpu.nvidia.com",dra_pool_name="sc-starwars-xxxx",namespace="gpu-test3",pod="pod2"} 23792 + +with Pod DRA info: + +container="ctr", +dra_claim_name="single-gpu", +dra_claim_namespace="gpu-test3", 
+dra_device_name="gpu-0",dra_driver_name="gpu.nvidia.com", +dra_pool_name="sc-starwars-xxxx", +namespace="gpu-test3", +pod="pod1" +``` +