Compare commits

..

7 Commits

Author SHA1 Message Date
Gitea Actions Bot 7555207117 Auto-update README with current k8s applications
Keycloak Terraform / Terraform (pull_request) Failing after 14m34s
Generated by CI/CD workflow on 2026-06-04 16:33:10

This PR updates the README.md file with the current list of applications found in the k8s/ directory structure.
2026-06-04 16:33:10 +00:00
Ultradesu 0018d2b418 pinned llama.cpp to server-rocm-b9501
Check with kubeconform / lint (push) Successful in 13s
Auto-update README / Generate README and Create MR (push) Failing after 11m59s
Update Kubernetes Services Wiki / Generate and Update K8s Wiki (push) Failing after 14m13s
2026-06-04 17:19:19 +03:00
Ultradesu 82dbe84075 Added llama.cpp on ai
Auto-update README / Generate README and Create MR (push) Failing after 10m17s
Check with kubeconform / lint (push) Failing after 11m23s
Update Kubernetes Services Wiki / Generate and Update K8s Wiki (push) Failing after 12m29s
2026-06-04 16:59:58 +03:00
Ultradesu 6b717f5219 Added amd-gpu controller
Check with kubeconform / lint (push) Successful in 33s
Update Kubernetes Services Wiki / Generate and Update K8s Wiki (push) Failing after 11m48s
Auto-update README / Generate README and Create MR (push) Failing after 14m2s
2026-06-04 16:46:49 +03:00
ab 0c1aa7d633 Merge pull request 'Auto-update README with k8s applications' (#406) from auto-update-readme-20260604-130654 into main
Update Kubernetes Services Wiki / Generate and Update K8s Wiki (push) Failing after 13m12s
Reviewed-on: #406
2026-06-04 13:43:51 +00:00
Gitea Actions Bot f7c279a67a Auto-update README with current k8s applications
Keycloak Terraform / Terraform (pull_request) Successful in 13s
Generated by CI/CD workflow on 2026-06-04 13:06:54

This PR updates the README.md file with the current list of applications found in the k8s/ directory structure.
2026-06-04 13:06:54 +00:00
Ultradesu 09e43ded52 Updated ollama & openwebui
Update Kubernetes Services Wiki / Generate and Update K8s Wiki (push) Successful in 6s
Check with kubeconform / lint (push) Successful in 5s
Auto-update README / Generate README and Create MR (push) Successful in 6s
2026-06-04 16:06:30 +03:00
10 changed files with 182 additions and 4 deletions
+1
View File
@@ -53,6 +53,7 @@ ArgoCD homelab project
| **k8s-secrets** | [![k8s-secrets](https://ag.hexor.cy/api/badge?name=k8s-secrets&revision=true)](https://ag.hexor.cy/applications/argocd/k8s-secrets) |
| **khm** | [![khm](https://ag.hexor.cy/api/badge?name=khm&revision=true)](https://ag.hexor.cy/applications/argocd/khm) |
| **lidarr** | [![lidarr](https://ag.hexor.cy/api/badge?name=lidarr&revision=true)](https://ag.hexor.cy/applications/argocd/lidarr) |
| **llamacpp** | [![llamacpp](https://ag.hexor.cy/api/badge?name=llamacpp&revision=true)](https://ag.hexor.cy/applications/argocd/llamacpp) |
| **matrix** | [![matrix](https://ag.hexor.cy/api/badge?name=matrix&revision=true)](https://ag.hexor.cy/applications/argocd/matrix) |
| **mtproxy** | [![mtproxy](https://ag.hexor.cy/api/badge?name=mtproxy&revision=true)](https://ag.hexor.cy/applications/argocd/mtproxy) |
| **n8n** | [![n8n](https://ag.hexor.cy/api/badge?name=n8n&revision=true)](https://ag.hexor.cy/applications/argocd/n8n) |
+20
View File
@@ -0,0 +1,20 @@
---
# Argo CD Application that deploys the manifests under k8s/apps/llamacpp
# into the llamacpp namespace of the in-cluster API server.
apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  name: llamacpp
  namespace: argocd
spec:
  project: apps
  # Where the rendered manifests are applied.
  destination:
    namespace: llamacpp
    server: https://kubernetes.default.svc
  # Where the manifests come from; HEAD tracks the repository's default branch.
  source:
    repoURL: ssh://git@gt.hexor.cy:30022/ab/homelab.git
    targetRevision: HEAD
    path: k8s/apps/llamacpp
  syncPolicy:
    # Sync automatically, revert manual drift (selfHeal) and delete resources
    # that were removed from Git (prune).
    automated:
      selfHeal: true
      prune: true
    syncOptions:
      # Let Argo CD create the destination namespace if it does not exist yet.
      - CreateNamespace=true
+12
View File
@@ -0,0 +1,12 @@
---
# Environment-style settings consumed by the llamacpp container via envFrom.
# ConfigMap data values must be strings, so every value is quoted explicitly
# to rule out implicit YAML typing (numbers, booleans such as "on").
apiVersion: v1
kind: ConfigMap
metadata:
  name: llamacpp-config
data:
  LLAMA_CACHE: '/models'
  LLAMA_ARG_HOST: '0.0.0.0'
  LLAMA_ARG_PORT: '8080'
  LLAMA_ARG_HF_REPO: 'unsloth/Qwen3.6-35B-A3B-MTP-GGUF:UD-Q6_K'
  LLAMA_ARG_CTX_SIZE: '32768'
  LLAMA_ARG_FLASH_ATTN: 'auto'
  LLAMA_ARG_FIT: 'on'
+70
View File
@@ -0,0 +1,70 @@
---
# Single-replica llama.cpp server pinned to the "ai" node and given one AMD GPU.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: llamacpp
  annotations:
    # Stakater Reloader annotation; presumably used to roll the pod when the
    # referenced ConfigMap/Secret changes — confirm Reloader runs in the cluster.
    reloader.stakater.com/auto: 'true'
  labels:
    app: llamacpp
spec:
  replicas: 1
  # Recreate: the old pod is terminated before the replacement is started.
  strategy:
    type: Recreate
  selector:
    matchLabels:
      app: llamacpp
  template:
    metadata:
      labels:
        app: llamacpp
    spec:
      # Schedule only on this specific node ...
      nodeSelector:
        kubernetes.io/hostname: ai.tail2fe2d.ts.net
      # ... and tolerate its workload=ai:NoSchedule taint.
      tolerations:
        - key: workload
          operator: Equal
          value: ai
          effect: NoSchedule
      containers:
        - name: llamacpp
          image: ghcr.io/ggml-org/llama.cpp:server-rocm-b9501
          imagePullPolicy: Always
          # All keys of llamacpp-config become environment variables.
          envFrom:
            - configMapRef:
                name: llamacpp-config
          env:
            # optional: true lets the pod start even when the secret or key
            # is absent.
            - name: HF_TOKEN
              valueFrom:
                secretKeyRef:
                  name: llamacpp-hf-token
                  key: token
                  optional: true
          ports:
            - name: http
              containerPort: 8080
              protocol: TCP
          resources:
            limits:
              amd.com/gpu: 1
          # Up to 180 failures x 10 s period = 30 minutes for /health to
          # succeed before the container is considered failed to start.
          startupProbe:
            httpGet:
              path: /health
              port: http
            failureThreshold: 180
            periodSeconds: 10
            timeoutSeconds: 5
          # After startup: marked unready after 3 consecutive failed checks.
          readinessProbe:
            httpGet:
              path: /health
              port: http
            failureThreshold: 3
            periodSeconds: 10
            timeoutSeconds: 5
          volumeMounts:
            - name: models
              mountPath: /models
      volumes:
        # Node-local directory (created on the node if missing), mounted at
        # /models — the same path LLAMA_CACHE is set to in llamacpp-config.
        - name: models
          hostPath:
            path: /k8s/llamacpp/models
            type: DirectoryOrCreate
+8
View File
@@ -0,0 +1,8 @@
---
# Kustomize entry point: lists the manifests that make up the llamacpp app.
apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization
resources:
  - app.yaml
  - configmap.yaml
  - deployment.yaml
  - service.yaml
+15
View File
@@ -0,0 +1,15 @@
---
# Cluster-internal Service that exposes pods labelled app=llamacpp on 8080.
apiVersion: v1
kind: Service
metadata:
  name: llamacpp
  labels:
    app: llamacpp
spec:
  type: ClusterIP
  selector:
    app: llamacpp
  ports:
    # targetPort refers to the container port by name ("http"), not number.
    - name: http
      port: 8080
      targetPort: http
      protocol: TCP
+3 -3
View File
@@ -9,18 +9,18 @@ resources:
helmCharts:
- name: ollama
repo: https://otwld.github.io/ollama-helm/
version: 1.49.0
version: 1.58.0
releaseName: ollama
namespace: ollama
valuesFile: ollama-values.yaml
includeCRDs: true
- name: open-webui
repo: https://helm.openwebui.com/
version: 12.10.0
version: 14.8.0
releaseName: openweb-ui
namespace: ollama
valuesFile: openweb-ui-values.yaml
includeCRDs: true
patches:
- path: patch-runtimeclass.yaml
- path: patch-runtimeclass.yaml
+1 -1
View File
@@ -31,7 +31,7 @@ ollama:
- qwen3-vl:8b
pipelines:
enabled: true
enabled: false
nodeSelector:
kubernetes.io/hostname: master.tail2fe2d.ts.net
+31
View File
@@ -0,0 +1,31 @@
# Helm values that appear to configure the ROCm k8s-device-plugin chart
# (the image below is docker.io/rocm/k8s-device-plugin).
# NOTE(review): indentation was lost in this view, so the nesting of the keys
# below is not visible here — confirm the hierarchy (e.g. where updateStrategy
# belongs) against the chart's own values.yaml before relying on it.
# Optional components switched off.
nfd:
enabled: false
labeller:
enabled: false
# Device-plugin image; the tag is quoted so it stays a string.
dp:
image:
repository: docker.io/rocm/k8s-device-plugin
tag: "1.31.0.9"
updateStrategy:
type: RollingUpdate
rollingUpdate:
maxUnavailable: 1
# Container hardening: no privilege escalation, all capabilities dropped.
securityContext:
allowPrivilegeEscalation: false
capabilities:
drop:
- ALL
# Tolerate the workload=ai:NoSchedule taint.
tolerations:
- key: workload
operator: Equal
value: ai
effect: NoSchedule
# Node selection: amd64 architecture and the ai.tail2fe2d.ts.net host.
node_selector_enabled: true
node_selector:
kubernetes.io/arch: amd64
kubernetes.io/hostname: ai.tail2fe2d.ts.net
+21
View File
@@ -13,3 +13,24 @@ helmCharts:
namespace: gpu-system
valuesFile: values.yaml
includeCRDs: true
- name: amd-gpu
repo: https://rocm.github.io/k8s-device-plugin/
version: 0.21.0
releaseName: amd-gpu-device-plugin
namespace: gpu-system
valuesFile: amd-gpu-values.yaml
includeCRDs: true
# Post-render patch: force the AMD device-plugin DaemonSet's nodeSelector.
patches:
  - target:
      group: apps
      version: v1
      kind: DaemonSet
      name: amd-gpu-device-plugin-daemonset
      namespace: gpu-system
    # JSON Patch (RFC 6902). NOTE(review): "replace" fails when the target
    # path does not exist — confirm the rendered DaemonSet always carries a
    # nodeSelector.
    patch: |-
      - op: replace
        path: /spec/template/spec/nodeSelector
        value:
          kubernetes.io/arch: amd64
          kubernetes.io/hostname: ai.tail2fe2d.ts.net