feat: Add NVIDIA GPU config and update Ollama to use it
This commit is contained in:
20
k8s/core/gpu/app.yaml
Normal file
20
k8s/core/gpu/app.yaml
Normal file
@@ -0,0 +1,20 @@
|
||||
---
# Argo CD Application that deploys the manifests found under k8s/core/gpu
# of the homelab repository into the gpu-system namespace of the local cluster.
apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  namespace: argocd
  name: gpu-system
spec:
  project: core
  source:
    repoURL: ssh://git@gt.hexor.cy:30022/ab/homelab.git
    path: k8s/core/gpu
    targetRevision: HEAD
  destination:
    server: https://kubernetes.default.svc
    namespace: gpu-system
  syncPolicy:
    syncOptions:
      # Let the sync create the destination namespace when it is missing.
      - CreateNamespace=true
    # Automated sync with both pruning and self-healing switched on.
    automated:
      prune: true
      selfHeal: true
|
||||
15
k8s/core/gpu/kustomization.yaml
Normal file
15
k8s/core/gpu/kustomization.yaml
Normal file
@@ -0,0 +1,15 @@
|
||||
---
# Kustomization for the GPU stack: two plain manifests plus the
# nvidia-device-plugin Helm chart rendered with the local values.yaml.
apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization

resources:
  - app.yaml
  - runtime-class.yaml

helmCharts:
  - name: nvidia-device-plugin
    releaseName: nvidia-device-plugin
    repo: https://nvidia.github.io/k8s-device-plugin
    version: 0.17.0
    namespace: gpu-system
    # Chart values are read from the sibling values.yaml file.
    valuesFile: values.yaml
    includeCRDs: true
|
||||
5
k8s/core/gpu/runtime-class.yaml
Normal file
5
k8s/core/gpu/runtime-class.yaml
Normal file
@@ -0,0 +1,5 @@
|
||||
---
# RuntimeClass "nvidia": pods that request runtimeClassName "nvidia" are
# run with the node runtime handler that is also named "nvidia".
apiVersion: node.k8s.io/v1
kind: RuntimeClass
metadata:
  name: nvidia
# Handler is a top-level RuntimeClass field, not part of metadata.
handler: nvidia
|
||||
21
k8s/core/gpu/values.yaml
Normal file
21
k8s/core/gpu/values.yaml
Normal file
@@ -0,0 +1,21 @@
|
||||
---
# Helm values for the nvidia-device-plugin chart.

# Run the plugin pods with the "nvidia" RuntimeClass.
runtimeClassName: nvidia

# Schedule the plugin only onto this one host.
nodeSelector:
  kubernetes.io/hostname: uk-desktop.tail2fe2d.ts.net

# NOTE(review): confirm that the chart actually consumes this key.
setAsDefault: false

config:
  # NOTE(review): name is set together with an inline map; confirm the chart
  # version in use accepts both and which ConfigMap name it ends up mounting.
  name: "nvidia-plugin-config"
  map:
    # use device driver mode instead of dev/nvmem
    default: |-
      version: v1
      flags:
        migStrategy: none
        failOnInitError: true
        nvidiaDriverRoot: "/"
        plugin:
          passDeviceSpecs: false
          deviceListStrategy: envvar
          deviceIDStrategy: uuid
|
||||
Reference in New Issue
Block a user