# Repository file listing (captured from the web viewer):
#   path:      auricom-home-cluster/kubernetes/apps/kube-system/intel-device-plugin/exporter/helmrelease.yaml
#   timestamp: 2024-12-03 22:21:21 +00:00
#   size:      71 lines, 1.8 KiB
#   language:  YAML

---
# yaml-language-server: $schema=https://raw.githubusercontent.com/bjw-s/helm-charts/main/charts/other/app-template/schemas/helmrelease-helm-v2.schema.json
# Flux HelmRelease that installs the intel-gpu-exporter image as a DaemonSet
# through the bjw-s app-template chart, and exposes it to Prometheus via a
# Service plus ServiceMonitor.
apiVersion: helm.toolkit.fluxcd.io/v2
kind: HelmRelease
metadata:
  # The &app anchor is reused below (service.app.controller) so the release
  # name and the controller reference cannot drift apart.
  name: &app intel-gpu-exporter
  namespace: kube-system
spec:
  interval: 30m
  chart:
    spec:
      chart: app-template
      version: 3.5.1
      sourceRef:
        kind: HelmRepository
        name: bjw-s
        namespace: flux-system
  maxHistory: 2
  install:
    createNamespace: true
    remediation:
      retries: 3
  upgrade:
    cleanupOnFail: true
    remediation:
      # After the retries below are exhausted, roll back instead of leaving
      # the failed upgrade in place.
      strategy: rollback
      retries: 3
  uninstall:
    keepHistory: false
  values:
    defaultPodOptions:
      # Label values are strings, hence the quoted "true".
      # NOTE(review): this label is presumably set by node-feature-discovery
      # rules for Intel GPUs — confirm against the cluster's NFD config.
      nodeSelector:
        intel.feature.node.kubernetes.io/gpu: "true"
    controllers:
      # Key must equal the value of the &app anchor; service.app.controller
      # refers to it through *app.
      intel-gpu-exporter:
        type: daemonset
        containers:
          app:
            image:
              repository: ghcr.io/onedr0p/intel-gpu-exporter
              # Floating tag pinned by digest.
              tag: rolling@sha256:5782b746f507149e7c3d5f7b19fe8d834fda854f117afcbdd21ecf822ef1ee02
            resources:
              requests:
                # Extended resource; the same quantity is repeated under limits.
                gpu.intel.com/i915_monitoring: 1
                cpu: 100m
                memory: 100Mi
              limits:
                gpu.intel.com/i915_monitoring: 1
                memory: 500Mi
            securityContext:
              # NOTE(review): presumably required to read GPU counters from
              # the host — confirm whether a narrower capability set suffices.
              privileged: true
    service:
      app:
        # Resolves to "intel-gpu-exporter", i.e. the controller defined above.
        controller: *app
        ports:
          http:
            port: 8080
    serviceMonitor:
      app:
        serviceName: app
        enabled: true
        endpoints:
          # "http" is the named port declared under service.app.ports.
          - port: http
            scheme: http
            path: /metrics
            interval: 1m
            scrapeTimeout: 10s
            relabelings:
              # Copy the scraped pod's node name into a "node" label.
              - sourceLabels: [__meta_kubernetes_pod_node_name]
                targetLabel: node