Compare commits

..

1 Commits

Author SHA1 Message Date
Gitea Actions Bot cf1db3557e Auto-update README with current k8s applications
Keycloak Terraform / Terraform (pull_request) Successful in 20s
Generated by CI/CD workflow on 2026-06-17 00:10:45

This PR updates the README.md file with the current list of applications found in the k8s/ directory structure.
2026-06-17 00:10:45 +00:00
5 changed files with 1 additions and 107 deletions
-12
View File
@@ -1,12 +0,0 @@
apiVersion: v1
kind: ConfigMap
metadata:
name: llamacpp-cuda-config
data:
LLAMA_CACHE: /models
LLAMA_ARG_HOST: 0.0.0.0
LLAMA_ARG_PORT: "8080"
LLAMA_ARG_HF_REPO: "unsloth/gemma-4-12b-it-GGUF:Q6_K"
LLAMA_ARG_CTX_SIZE: "32768"
LLAMA_ARG_FLASH_ATTN: auto
LLAMA_ARG_FIT: "on"
-72
View File
@@ -1,72 +0,0 @@
apiVersion: apps/v1
kind: Deployment
metadata:
name: llamacpp-cuda
annotations:
reloader.stakater.com/auto: "true"
labels:
app: llamacpp-cuda
spec:
replicas: 1
strategy:
type: Recreate
selector:
matchLabels:
app: llamacpp-cuda
template:
metadata:
labels:
app: llamacpp-cuda
spec:
dnsPolicy: Default
runtimeClassName: nvidia
nodeSelector:
kubernetes.io/hostname: uk-desktop.tail2fe2d.ts.net
tolerations:
- key: workload
operator: Equal
value: desktop
effect: NoSchedule
containers:
- name: llamacpp
image: ghcr.io/ggml-org/llama.cpp:server-cuda-b9501
imagePullPolicy: IfNotPresent
envFrom:
- configMapRef:
name: llamacpp-cuda-config
env:
- name: HF_TOKEN
valueFrom:
secretKeyRef:
name: llamacpp-hf-token
key: token
optional: true
ports:
- name: http
containerPort: 8080
protocol: TCP
resources:
limits:
nvidia.com/gpu: 1
startupProbe:
httpGet:
path: /health
port: http
failureThreshold: 180
periodSeconds: 10
timeoutSeconds: 5
readinessProbe:
httpGet:
path: /health
port: http
failureThreshold: 3
periodSeconds: 10
timeoutSeconds: 5
volumeMounts:
- name: models
mountPath: /models
volumes:
- name: models
hostPath:
path: /data/llama.cpp/models
type: DirectoryOrCreate
-3
View File
@@ -3,9 +3,6 @@ kind: Kustomization
resources:
- app.yaml
- configmap-cuda.yaml
- configmap.yaml
- deployment-cuda.yaml
- deployment.yaml
- service-cuda.yaml
- service.yaml
-15
View File
@@ -1,15 +0,0 @@
apiVersion: v1
kind: Service
metadata:
name: llamacpp-cuda
labels:
app: llamacpp-cuda
spec:
type: ClusterIP
selector:
app: llamacpp-cuda
ports:
- name: http
port: 8080
targetPort: http
protocol: TCP
+1 -5
View File
@@ -11,7 +11,7 @@ spec:
selector:
matchLabels:
app: pasarguard
replicas: 2
replicas: 1
strategy:
type: RollingUpdate
template:
@@ -50,10 +50,6 @@ spec:
value: "/app/tls/tls.crt"
- name: UVICORN_SSL_KEYFILE
value: "/app/tls/tls.key"
- name: UVICORN_PROXY_HEADERS
value: "true"
- name: FORWARDED_ALLOW_IPS
value: "*"
- name: CUSTOM_TEMPLATES_DIRECTORY
value: "/code/app/templates/"
- name: SUBSCRIPTION_PAGE_TEMPLATE