Add Nvidia GPU operator Helm configuration files #43
@@ -0,0 +1,18 @@
|
|||||||
|
---
# Device-plugin configuration for the NVIDIA GPU operator, stored in the
# gpu-operator namespace. It defines a single profile, "any", that sets
# timeSlicing replicas to 4 for the nvidia.com/gpu resource.
apiVersion: v1
kind: ConfigMap
metadata:
  name: time-slicing-config
  namespace: gpu-operator
data:
  # The key ("any") is the profile name that the cluster policy patch
  # below selects as the default.
  any: |-
    version: v1
    flags:
      migStrategy: none
    sharing:
      timeSlicing:
        resources:
        - name: nvidia.com/gpu
          replicas: 4

# Remember to patch the cluster policy so that it uses this ConfigMap:
#
#   kubectl patch clusterpolicy/cluster-policy -n gpu-operator --type merge \
#     -p '{"spec": {"devicePlugin": {"config": {"name": "time-slicing-config", "default": "any"}}}}'
#
# NOTE(review): the gpu-operator chart appears to expose the same setting as
# the values devicePlugin.config.name / devicePlugin.config.default, which
# would avoid a manual step outside GitOps. Confirm against the chart
# version in use before switching.
|
||||||
31
clusters/default/helm/gpu-operator/gpu-operator-release.yml
Normal file
31
clusters/default/helm/gpu-operator/gpu-operator-release.yml
Normal file
@@ -0,0 +1,31 @@
|
|||||||
|
---
# Flux HelmRelease that installs the gpu-operator chart into the
# gpu-operator namespace.
apiVersion: helm.toolkit.fluxcd.io/v2
kind: HelmRelease
metadata:
  name: gpu-operator
  namespace: gpu-operator
spec:
  interval: 24h
  chart:
    spec:
      # Pinned chart version, pulled from the "nvidia" HelmRepository
      # that lives in flux-system.
      chart: gpu-operator
      version: "v25.3.4"
      sourceRef:
        kind: HelmRepository
        name: nvidia
        namespace: flux-system
      interval: 24h
  install:
    createNamespace: true
  upgrade:
    remediation:
      remediateLastFailure: true
  # Values handed to the chart.
  values:
    driver:
      # NOTE(review): presumably the NVIDIA driver is already installed
      # on the hosts, so the operator-managed driver is off. Confirm.
      enabled: false
    toolkit:
      # Point the toolkit at the containerd socket and config under the
      # k3s paths.
      env:
        - name: CONTAINERD_SOCKET
          value: /run/k3s/containerd/containerd.sock
        - name: CONTAINERD_CONFIG
          value: /var/lib/rancher/k3s/agent/etc/containerd/config.toml
|
||||||
9
clusters/default/helm/gpu-operator/gpu-operator-repo.yml
Normal file
9
clusters/default/helm/gpu-operator/gpu-operator-repo.yml
Normal file
@@ -0,0 +1,9 @@
|
|||||||
|
---
# Flux HelmRepository source named "nvidia" in flux-system, pointing at
# the NVIDIA NGC Helm chart index.
apiVersion: source.toolkit.fluxcd.io/v1
kind: HelmRepository
metadata:
  name: nvidia
  namespace: flux-system
spec:
  interval: 24h
  url: https://helm.ngc.nvidia.com/nvidia
|
||||||
Reference in New Issue
Block a user