Kubeintel Logo

Kubeintel

  • Search
  • Pods
  • Deployments
  • Statefulsets
  • Jobs
  • Daemonsets
  • Namespaces
  • Nodes
  • Services
  • Configmaps
  1. Home
  2. /
  3. namespaces
  4. /
  5. kube-system
  6. /
  7. daemonsets
  8. /
  9. do-node-agent-amd-device-metrics-exporter
Summary
Metadata
Containers
Status
Spec
All
Pods
Events
Investigator
DaemonSet Details

Name: do-node-agent-amd-device-metrics-exporter

Namespace: kube-system

Pods: 0/0

Selector: app: do-node-agent-amd-de...

Kubectl Commands
  • View
  • Delete
  • Describe
Containers
Name | Image | Ports...
amdgpu-metrics-exporter-container | ghcr.io/digitalocean-packages/amd-gpu-de... | 5000/TCP...
do-node-agent | ghcr.io/digitalocean-packages/do-agent:3... | N/A...
  • 1
Init Containers
Name | Image | Ports...
dynamic-config | gcr.io/distroless/static-debian12:debug-... | N/A...
driver-init | busybox:1.36 | N/A...
  • 1
Metadata

Creation Time: 2025-08-14T22:04:45Z

Labels:

  • app: do-node-agent-amd-de...
  • c3.doks.digitalocean.com/component: do-node-agent...
  • c3.doks.digitalocean.com/plane: data...
  • doks.digitalocean.com/managed: true...

Annotation:

  • deprecated.daemonset.template.generation: 2...
# Object metadata of the DaemonSet (contents of its `metadata` mapping).
# Indentation restored: the label and annotation entries are children of
# `labels:` / `annotations:`, matching the Labels/Annotation summary lists
# shown earlier on the page.
name: do-node-agent-amd-device-metrics-exporter
namespace: kube-system
uid: 69947fe6-da27-4ba9-9099-88aa6c810404
# Quoted so the all-digit value stays a string.
resourceVersion: '134440246'
generation: 2
# Quoted so the value stays a string rather than a parsed timestamp.
creationTimestamp: '2025-08-14T22:04:45Z'
labels:
  app: do-node-agent-amd-device-metrics-exporter
  c3.doks.digitalocean.com/component: do-node-agent
  c3.doks.digitalocean.com/plane: data
  # Quoted so the value is the string 'true', not a boolean.
  doks.digitalocean.com/managed: 'true'
annotations:
  deprecated.daemonset.template.generation: '2'
# Main containers of the DaemonSet pod template (a two-item sequence).
# Indentation restored so every field nests under its container entry.
- name: amdgpu-metrics-exporter-container
  image: ghcr.io/digitalocean-packages/amd-gpu-device-metrics-exporter:v1.3.1
  workingDir: /root
  ports:
    - containerPort: 5000
      protocol: TCP
  env:
    # Node name is injected from the pod's own spec.nodeName field.
    - name: NODE_NAME
      valueFrom:
        fieldRef:
          apiVersion: v1
          fieldPath: spec.nodeName
    # Same port number as the containerPort above; quoted because env
    # values are strings.
    - name: METRICS_EXPORTER_PORT
      value: '5000'
  resources: {}
  volumeMounts:
    - name: dev-volume
      mountPath: /dev
    - name: sys-volume
      mountPath: /sys
    - name: pod-resources
      mountPath: /var/lib/kubelet/pod-resources
    - name: exporter-health-grpc-volume
      mountPath: /var/lib/amd-metrics-exporter
    - name: exporter-slurm-job
      mountPath: /var/run/exporter
    - name: metrics-config-volume
      mountPath: /etc/metrics/
  terminationMessagePath: /dev/termination-log
  terminationMessagePolicy: File
  imagePullPolicy: Always
  securityContext:
    privileged: true
- name: do-node-agent
  image: ghcr.io/digitalocean-packages/do-agent:3.18.2
  command:
    - /bin/do-agent
  args:
    # Path under the /etc/config mount (dynamic-config volume) below.
    - '@/etc/config/do-agent-config'
    - '--path.procfs=/host/proc'
    - '--path.sysfs=/host/sys'
    - >-
      --k8s-metrics-path=http://kube-state-metrics.kube-system.svc.cluster.local:8080/metrics
    # Port 5000 on localhost matches the exporter container's port above.
    - '--gpu-metrics-path=http://127.0.0.1:5000/metrics'
    - >-
      --additional-label=kubernetes_cluster_uuid:f6ce2907-8531-4ab3-861e-4e2affa620b1
  resources:
    limits:
      memory: 300Mi
    requests:
      cpu: 102m
      memory: 80Mi
  volumeMounts:
    - name: proc
      readOnly: true
      mountPath: /host/proc
    - name: sys
      readOnly: true
      mountPath: /host/sys
    - name: root
      readOnly: true
      mountPath: /host/root
      mountPropagation: HostToContainer
    - name: dynamic-config
      mountPath: /etc/config
  terminationMessagePath: /dev/termination-log
  terminationMessagePolicy: File
  imagePullPolicy: IfNotPresent
# Status counters of the DaemonSet (contents of its `status` mapping).
# All scheduling counts are 0, consistent with the "Pods: 0/0" summary line.
currentNumberScheduled: 0
numberMisscheduled: 0
desiredNumberScheduled: 0
numberReady: 0
observedGeneration: 2
# DaemonSet spec (contents of its `spec` mapping), with indentation restored.
selector:
  matchLabels:
    app: do-node-agent-amd-device-metrics-exporter
template:
  metadata:
    creationTimestamp: null
    labels:
      app: do-node-agent-amd-device-metrics-exporter
      doks.digitalocean.com/managed: 'true'
    annotations:
      clusterlint.digitalocean.com/disabled-checks: resource-requirements,hostpath-volume
  spec:
    volumes:
      - name: proc
        hostPath:
          path: /proc
          type: ''
      - name: sys
        hostPath:
          path: /sys
          type: ''
      - name: root
        hostPath:
          path: /
          type: ''
      # Scratch volume shared by the dynamic-config init container (writer)
      # and the do-node-agent container (mounted at /etc/config).
      - name: dynamic-config
        emptyDir: {}
      - name: host-kubectl
        hostPath:
          path: /usr/bin/kubectl
          type: File
      - name: dev-volume
        hostPath:
          path: /dev
          type: Directory
      - name: sys-volume
        hostPath:
          path: /sys
          type: Directory
      - name: pod-resources
        hostPath:
          path: /var/lib/kubelet/pod-resources
          type: Directory
      - name: exporter-health-grpc-volume
        hostPath:
          path: /var/lib/amd-metrics-exporter
          type: DirectoryOrCreate
      - name: exporter-slurm-job
        hostPath:
          path: /var/run/exporter
          type: DirectoryOrCreate
      - name: metrics-config-volume
        configMap:
          name: do-node-agent-device-metrics-exporter-charts-configmap
          # Decimal 420 is octal 0644.
          defaultMode: 420
    initContainers:
      - name: dynamic-config
        image: gcr.io/distroless/static-debian12:debug-nonroot-amd64
        command:
          - sh
          - '-c'
          # Literal block: one shell statement per line. The scraped text
          # showed this as a folded (`>`) scalar with its blank separator
          # lines stripped, which would collapse the script onto one line.
          # Lines that had been wrapped mid-command (`-o` / `jsonpath=...`
          # and `>` / `/etc/config/...`) are rejoined here.
          # NOTE(review): assumes the original script had no blank lines
          # between statements; confirm against the live object.
          - |
            set -o errexit
            set -o pipefail
            set -o nounset
            KUBECTL=/host/usr/bin/kubectl
            POOL_ID="$(${KUBECTL} get node ${NODE_NAME} -o jsonpath='{.metadata.labels.doks\.digitalocean\.com/node-pool-id}')"
            [[ -z "${POOL_ID}" ]] && echo "Pool ID label missing" && exit 1
            echo "--additional-label=kubernetes_node_pool_uuid:${POOL_ID}" > /etc/config/do-agent-config
            echo "Pool ID configured: ${POOL_ID}"
        env:
          - name: NODE_NAME
            valueFrom:
              fieldRef:
                apiVersion: v1
                fieldPath: spec.nodeName
        resources: {}
        volumeMounts:
          - name: dynamic-config
            mountPath: /etc/config
          - name: host-kubectl
            mountPath: /host/usr/bin/kubectl
        terminationMessagePath: /dev/termination-log
        terminationMessagePolicy: File
        imagePullPolicy: IfNotPresent
      - name: driver-init
        image: busybox:1.36
        command:
          - sh
          - '-c'
          # Single shell line, folded for width: loops every 2 seconds until
          # both directories exist under the /host-sys mount.
          - >-
            while [ ! -d /host-sys/class/kfd ] || [ ! -d
            /host-sys/module/amdgpu/drivers/ ]; do echo "amdgpu driver is not
            loaded "; sleep 2 ;done
        resources: {}
        volumeMounts:
          - name: sys-volume
            mountPath: /host-sys
        terminationMessagePath: /dev/termination-log
        terminationMessagePolicy: File
        imagePullPolicy: IfNotPresent
        securityContext:
          privileged: true
    containers:
      - name: amdgpu-metrics-exporter-container
        image: ghcr.io/digitalocean-packages/amd-gpu-device-metrics-exporter:v1.3.1
        workingDir: /root
        ports:
          - containerPort: 5000
            protocol: TCP
        env:
          - name: NODE_NAME
            valueFrom:
              fieldRef:
                apiVersion: v1
                fieldPath: spec.nodeName
          # Same port number as the containerPort above.
          - name: METRICS_EXPORTER_PORT
            value: '5000'
        resources: {}
        volumeMounts:
          - name: dev-volume
            mountPath: /dev
          - name: sys-volume
            mountPath: /sys
          - name: pod-resources
            mountPath: /var/lib/kubelet/pod-resources
          - name: exporter-health-grpc-volume
            mountPath: /var/lib/amd-metrics-exporter
          - name: exporter-slurm-job
            mountPath: /var/run/exporter
          - name: metrics-config-volume
            mountPath: /etc/metrics/
        terminationMessagePath: /dev/termination-log
        terminationMessagePolicy: File
        imagePullPolicy: Always
        securityContext:
          privileged: true
      - name: do-node-agent
        image: ghcr.io/digitalocean-packages/do-agent:3.18.2
        command:
          - /bin/do-agent
        args:
          # File written by the dynamic-config init container.
          - '@/etc/config/do-agent-config'
          - '--path.procfs=/host/proc'
          - '--path.sysfs=/host/sys'
          - >-
            --k8s-metrics-path=http://kube-state-metrics.kube-system.svc.cluster.local:8080/metrics
          # Port 5000 on localhost matches the exporter container's port.
          - '--gpu-metrics-path=http://127.0.0.1:5000/metrics'
          - >-
            --additional-label=kubernetes_cluster_uuid:f6ce2907-8531-4ab3-861e-4e2affa620b1
        resources:
          limits:
            memory: 300Mi
          requests:
            cpu: 102m
            memory: 80Mi
        volumeMounts:
          - name: proc
            readOnly: true
            mountPath: /host/proc
          - name: sys
            readOnly: true
            mountPath: /host/sys
          - name: root
            readOnly: true
            mountPath: /host/root
            mountPropagation: HostToContainer
          - name: dynamic-config
            mountPath: /etc/config
        terminationMessagePath: /dev/termination-log
        terminationMessagePolicy: File
        imagePullPolicy: IfNotPresent
    restartPolicy: Always
    terminationGracePeriodSeconds: 30
    dnsPolicy: ClusterFirstWithHostNet
    nodeSelector:
      doks.digitalocean.com/gpu-brand: amd
      kubernetes.io/os: linux
    serviceAccountName: do-agent
    serviceAccount: do-agent
    hostNetwork: true
    securityContext: {}
    schedulerName: default-scheduler
    tolerations:
      - operator: Exists
    priorityClassName: system-node-critical
updateStrategy:
  type: RollingUpdate
  rollingUpdate:
    maxUnavailable: 1
    maxSurge: 0
revisionHistoryLimit: 10
# Object metadata of the DaemonSet. Indentation restored so the fields nest
# under `metadata:` and the label/annotation entries nest under their keys.
metadata:
  name: do-node-agent-amd-device-metrics-exporter
  namespace: kube-system
  uid: 69947fe6-da27-4ba9-9099-88aa6c810404
  # Quoted so the all-digit value stays a string.
  resourceVersion: '134440246'
  generation: 2
  # Quoted so the value stays a string rather than a parsed timestamp.
  creationTimestamp: '2025-08-14T22:04:45Z'
  labels:
    app: do-node-agent-amd-device-metrics-exporter
    c3.doks.digitalocean.com/component: do-node-agent
    c3.doks.digitalocean.com/plane: data
    # Quoted so the value is the string 'true', not a boolean.
    doks.digitalocean.com/managed: 'true'
  annotations:
    deprecated.daemonset.template.generation: '2'
# DaemonSet spec, with indentation restored.
spec:
  selector:
    matchLabels:
      app: do-node-agent-amd-device-metrics-exporter
  template:
    metadata:
      creationTimestamp: null
      labels:
        app: do-node-agent-amd-device-metrics-exporter
        doks.digitalocean.com/managed: 'true'
      annotations:
        clusterlint.digitalocean.com/disabled-checks: resource-requirements,hostpath-volume
    spec:
      volumes:
        - name: proc
          hostPath:
            path: /proc
            type: ''
        - name: sys
          hostPath:
            path: /sys
            type: ''
        - name: root
          hostPath:
            path: /
            type: ''
        # Scratch volume shared by the dynamic-config init container (writer)
        # and the do-node-agent container (mounted at /etc/config).
        - name: dynamic-config
          emptyDir: {}
        - name: host-kubectl
          hostPath:
            path: /usr/bin/kubectl
            type: File
        - name: dev-volume
          hostPath:
            path: /dev
            type: Directory
        - name: sys-volume
          hostPath:
            path: /sys
            type: Directory
        - name: pod-resources
          hostPath:
            path: /var/lib/kubelet/pod-resources
            type: Directory
        - name: exporter-health-grpc-volume
          hostPath:
            path: /var/lib/amd-metrics-exporter
            type: DirectoryOrCreate
        - name: exporter-slurm-job
          hostPath:
            path: /var/run/exporter
            type: DirectoryOrCreate
        - name: metrics-config-volume
          configMap:
            name: do-node-agent-device-metrics-exporter-charts-configmap
            # Decimal 420 is octal 0644.
            defaultMode: 420
      initContainers:
        - name: dynamic-config
          image: gcr.io/distroless/static-debian12:debug-nonroot-amd64
          command:
            - sh
            - '-c'
            # Literal block: one shell statement per line. The scraped text
            # showed this as a folded (`>`) scalar with its blank separator
            # lines stripped, which would collapse the script onto one line.
            # Lines that had been wrapped mid-command (`-o` / `jsonpath=...`
            # and `>` / `/etc/config/...`) are rejoined here.
            # NOTE(review): assumes the original script had no blank lines
            # between statements; confirm against the live object.
            - |
              set -o errexit
              set -o pipefail
              set -o nounset
              KUBECTL=/host/usr/bin/kubectl
              POOL_ID="$(${KUBECTL} get node ${NODE_NAME} -o jsonpath='{.metadata.labels.doks\.digitalocean\.com/node-pool-id}')"
              [[ -z "${POOL_ID}" ]] && echo "Pool ID label missing" && exit 1
              echo "--additional-label=kubernetes_node_pool_uuid:${POOL_ID}" > /etc/config/do-agent-config
              echo "Pool ID configured: ${POOL_ID}"
          env:
            - name: NODE_NAME
              valueFrom:
                fieldRef:
                  apiVersion: v1
                  fieldPath: spec.nodeName
          resources: {}
          volumeMounts:
            - name: dynamic-config
              mountPath: /etc/config
            - name: host-kubectl
              mountPath: /host/usr/bin/kubectl
          terminationMessagePath: /dev/termination-log
          terminationMessagePolicy: File
          imagePullPolicy: IfNotPresent
        - name: driver-init
          image: busybox:1.36
          command:
            - sh
            - '-c'
            # Single shell line, folded for width: loops every 2 seconds
            # until both directories exist under the /host-sys mount.
            - >-
              while [ ! -d /host-sys/class/kfd ] || [ ! -d
              /host-sys/module/amdgpu/drivers/ ]; do echo "amdgpu driver is not
              loaded "; sleep 2 ;done
          resources: {}
          volumeMounts:
            - name: sys-volume
              mountPath: /host-sys
          terminationMessagePath: /dev/termination-log
          terminationMessagePolicy: File
          imagePullPolicy: IfNotPresent
          securityContext:
            privileged: true
      containers:
        - name: amdgpu-metrics-exporter-container
          image: ghcr.io/digitalocean-packages/amd-gpu-device-metrics-exporter:v1.3.1
          workingDir: /root
          ports:
            - containerPort: 5000
              protocol: TCP
          env:
            - name: NODE_NAME
              valueFrom:
                fieldRef:
                  apiVersion: v1
                  fieldPath: spec.nodeName
            # Same port number as the containerPort above.
            - name: METRICS_EXPORTER_PORT
              value: '5000'
          resources: {}
          volumeMounts:
            - name: dev-volume
              mountPath: /dev
            - name: sys-volume
              mountPath: /sys
            - name: pod-resources
              mountPath: /var/lib/kubelet/pod-resources
            - name: exporter-health-grpc-volume
              mountPath: /var/lib/amd-metrics-exporter
            - name: exporter-slurm-job
              mountPath: /var/run/exporter
            - name: metrics-config-volume
              mountPath: /etc/metrics/
          terminationMessagePath: /dev/termination-log
          terminationMessagePolicy: File
          imagePullPolicy: Always
          securityContext:
            privileged: true
        - name: do-node-agent
          image: ghcr.io/digitalocean-packages/do-agent:3.18.2
          command:
            - /bin/do-agent
          args:
            # File written by the dynamic-config init container.
            - '@/etc/config/do-agent-config'
            - '--path.procfs=/host/proc'
            - '--path.sysfs=/host/sys'
            - >-
              --k8s-metrics-path=http://kube-state-metrics.kube-system.svc.cluster.local:8080/metrics
            # Port 5000 on localhost matches the exporter container's port.
            - '--gpu-metrics-path=http://127.0.0.1:5000/metrics'
            - >-
              --additional-label=kubernetes_cluster_uuid:f6ce2907-8531-4ab3-861e-4e2affa620b1
          resources:
            limits:
              memory: 300Mi
            requests:
              cpu: 102m
              memory: 80Mi
          volumeMounts:
            - name: proc
              readOnly: true
              mountPath: /host/proc
            - name: sys
              readOnly: true
              mountPath: /host/sys
            - name: root
              readOnly: true
              mountPath: /host/root
              mountPropagation: HostToContainer
            - name: dynamic-config
              mountPath: /etc/config
          terminationMessagePath: /dev/termination-log
          terminationMessagePolicy: File
          imagePullPolicy: IfNotPresent
      restartPolicy: Always
      terminationGracePeriodSeconds: 30
      dnsPolicy: ClusterFirstWithHostNet
      nodeSelector:
        doks.digitalocean.com/gpu-brand: amd
        kubernetes.io/os: linux
      serviceAccountName: do-agent
      serviceAccount: do-agent
      hostNetwork: true
      securityContext: {}
      schedulerName: default-scheduler
      tolerations:
        - operator: Exists
      priorityClassName: system-node-critical
  updateStrategy:
    type: RollingUpdate
    rollingUpdate:
      maxUnavailable: 1
      maxSurge: 0
  revisionHistoryLimit: 10
# Status counters of the DaemonSet. Indentation restored so the counters
# nest under `status:` instead of leaving it null. All scheduling counts are
# 0, consistent with the "Pods: 0/0" summary line.
status:
  currentNumberScheduled: 0
  numberMisscheduled: 0
  desiredNumberScheduled: 0
  numberReady: 0
  observedGeneration: 2
Kubeintel ©2024