Compare commits
1 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| 1a40cb14cf |
@@ -9,7 +9,7 @@ data:
|
|||||||
set -euo pipefail
|
set -euo pipefail
|
||||||
|
|
||||||
PORT="${1:-5847}"
|
PORT="${1:-5847}"
|
||||||
VPN_CIDR="${2:-10.8.0.0/16}"
|
VPN_CIDR="${2:-10.8.1.0/24}"
|
||||||
|
|
||||||
external_interface() {
|
external_interface() {
|
||||||
ip route get 1.1.1.1 | awk '{for (i=1;i<=NF;i++) if ($i=="dev") {print $(i+1); exit}}'
|
ip route get 1.1.1.1 | awk '{for (i=1;i<=NF;i++) if ($i=="dev") {print $(i+1); exit}}'
|
||||||
@@ -68,7 +68,7 @@ data:
|
|||||||
set -euo pipefail
|
set -euo pipefail
|
||||||
|
|
||||||
PORT="${1:-5847}"
|
PORT="${1:-5847}"
|
||||||
VPN_CIDR="${2:-10.8.0.0/16}"
|
VPN_CIDR="${2:-10.8.1.0/24}"
|
||||||
|
|
||||||
external_interface() {
|
external_interface() {
|
||||||
ip route get 1.1.1.1 | awk '{for (i=1;i<=NF;i++) if ($i=="dev") {print $(i+1); exit}}'
|
ip route get 1.1.1.1 | awk '{for (i=1;i<=NF;i++) if ($i=="dev") {print $(i+1); exit}}'
|
||||||
|
|||||||
@@ -15,7 +15,7 @@ spec:
|
|||||||
awg0.conf: |-
|
awg0.conf: |-
|
||||||
[Interface]
|
[Interface]
|
||||||
PrivateKey = {{ .server_private_key }}
|
PrivateKey = {{ .server_private_key }}
|
||||||
Address = 10.8.0.1/16
|
Address = 10.8.1.1/24
|
||||||
ListenPort = 5847
|
ListenPort = 5847
|
||||||
MTU = 1376
|
MTU = 1376
|
||||||
Jc = 4
|
Jc = 4
|
||||||
@@ -29,8 +29,8 @@ spec:
|
|||||||
H2 = 3288052141
|
H2 = 3288052141
|
||||||
H3 = 1766607858
|
H3 = 1766607858
|
||||||
H4 = 2528465083
|
H4 = 2528465083
|
||||||
PostUp = /scripts/firewall-up.sh 5847 10.8.0.0/16
|
PostUp = /scripts/firewall-up.sh 5847 10.8.1.0/24
|
||||||
PostDown = /scripts/firewall-down.sh 5847 10.8.0.0/16
|
PostDown = /scripts/firewall-down.sh 5847 10.8.1.0/24
|
||||||
data:
|
data:
|
||||||
- secretKey: server_private_key
|
- secretKey: server_private_key
|
||||||
sourceRef:
|
sourceRef:
|
||||||
|
|||||||
@@ -1,12 +0,0 @@
|
|||||||
apiVersion: v1
|
|
||||||
kind: ConfigMap
|
|
||||||
metadata:
|
|
||||||
name: llamacpp-cuda-config
|
|
||||||
data:
|
|
||||||
LLAMA_CACHE: /models
|
|
||||||
LLAMA_ARG_HOST: 0.0.0.0
|
|
||||||
LLAMA_ARG_PORT: "8080"
|
|
||||||
LLAMA_ARG_HF_REPO: "unsloth/gemma-4-12b-it-GGUF:Q6_K"
|
|
||||||
LLAMA_ARG_CTX_SIZE: "128000"
|
|
||||||
LLAMA_ARG_FLASH_ATTN: auto
|
|
||||||
LLAMA_ARG_FIT: "on"
|
|
||||||
@@ -1,72 +0,0 @@
|
|||||||
apiVersion: apps/v1
|
|
||||||
kind: Deployment
|
|
||||||
metadata:
|
|
||||||
name: llamacpp-cuda
|
|
||||||
annotations:
|
|
||||||
reloader.stakater.com/auto: "true"
|
|
||||||
labels:
|
|
||||||
app: llamacpp-cuda
|
|
||||||
spec:
|
|
||||||
replicas: 1
|
|
||||||
strategy:
|
|
||||||
type: Recreate
|
|
||||||
selector:
|
|
||||||
matchLabels:
|
|
||||||
app: llamacpp-cuda
|
|
||||||
template:
|
|
||||||
metadata:
|
|
||||||
labels:
|
|
||||||
app: llamacpp-cuda
|
|
||||||
spec:
|
|
||||||
dnsPolicy: Default
|
|
||||||
runtimeClassName: nvidia
|
|
||||||
nodeSelector:
|
|
||||||
kubernetes.io/hostname: uk-desktop.tail2fe2d.ts.net
|
|
||||||
tolerations:
|
|
||||||
- key: workload
|
|
||||||
operator: Equal
|
|
||||||
value: desktop
|
|
||||||
effect: NoSchedule
|
|
||||||
containers:
|
|
||||||
- name: llamacpp
|
|
||||||
image: ghcr.io/ggml-org/llama.cpp:server-cuda-b9501
|
|
||||||
imagePullPolicy: IfNotPresent
|
|
||||||
envFrom:
|
|
||||||
- configMapRef:
|
|
||||||
name: llamacpp-cuda-config
|
|
||||||
env:
|
|
||||||
- name: HF_TOKEN
|
|
||||||
valueFrom:
|
|
||||||
secretKeyRef:
|
|
||||||
name: llamacpp-hf-token
|
|
||||||
key: token
|
|
||||||
optional: true
|
|
||||||
ports:
|
|
||||||
- name: http
|
|
||||||
containerPort: 8080
|
|
||||||
protocol: TCP
|
|
||||||
resources:
|
|
||||||
limits:
|
|
||||||
nvidia.com/gpu: 1
|
|
||||||
startupProbe:
|
|
||||||
httpGet:
|
|
||||||
path: /health
|
|
||||||
port: http
|
|
||||||
failureThreshold: 180
|
|
||||||
periodSeconds: 10
|
|
||||||
timeoutSeconds: 5
|
|
||||||
readinessProbe:
|
|
||||||
httpGet:
|
|
||||||
path: /health
|
|
||||||
port: http
|
|
||||||
failureThreshold: 3
|
|
||||||
periodSeconds: 10
|
|
||||||
timeoutSeconds: 5
|
|
||||||
volumeMounts:
|
|
||||||
- name: models
|
|
||||||
mountPath: /models
|
|
||||||
volumes:
|
|
||||||
- name: models
|
|
||||||
hostPath:
|
|
||||||
path: /data/llama.cpp/models
|
|
||||||
type: DirectoryOrCreate
|
|
||||||
@@ -3,9 +3,6 @@ kind: Kustomization
|
|||||||
|
|
||||||
resources:
|
resources:
|
||||||
- app.yaml
|
- app.yaml
|
||||||
- configmap-cuda.yaml
|
|
||||||
- configmap.yaml
|
- configmap.yaml
|
||||||
- deployment-cuda.yaml
|
|
||||||
- deployment.yaml
|
- deployment.yaml
|
||||||
- service-cuda.yaml
|
|
||||||
- service.yaml
|
- service.yaml
|
||||||
|
|||||||
@@ -1,15 +0,0 @@
|
|||||||
apiVersion: v1
|
|
||||||
kind: Service
|
|
||||||
metadata:
|
|
||||||
name: llamacpp-cuda
|
|
||||||
labels:
|
|
||||||
app: llamacpp-cuda
|
|
||||||
spec:
|
|
||||||
type: ClusterIP
|
|
||||||
selector:
|
|
||||||
app: llamacpp-cuda
|
|
||||||
ports:
|
|
||||||
- name: http
|
|
||||||
port: 8080
|
|
||||||
targetPort: http
|
|
||||||
protocol: TCP
|
|
||||||
@@ -15,14 +15,14 @@ resources:
|
|||||||
- service.yaml
|
- service.yaml
|
||||||
- ingress.yaml
|
- ingress.yaml
|
||||||
|
|
||||||
# helmCharts:
|
helmCharts:
|
||||||
# - name: yacy
|
- name: yacy
|
||||||
# repo: https://gt.hexor.cy/api/packages/ab/helm
|
repo: https://gt.hexor.cy/api/packages/ab/helm
|
||||||
# version: 0.1.2
|
version: 0.1.2
|
||||||
# releaseName: yacy
|
releaseName: yacy
|
||||||
# namespace: n8n
|
namespace: n8n
|
||||||
# valuesFile: values-yacy.yaml
|
valuesFile: values-yacy.yaml
|
||||||
# includeCRDs: true
|
includeCRDs: true
|
||||||
|
|
||||||
commonLabels:
|
commonLabels:
|
||||||
app.kubernetes.io/name: n8n
|
app.kubernetes.io/name: n8n
|
||||||
|
|||||||
@@ -11,7 +11,7 @@ spec:
|
|||||||
selector:
|
selector:
|
||||||
matchLabels:
|
matchLabels:
|
||||||
app: pasarguard
|
app: pasarguard
|
||||||
replicas: 2
|
replicas: 1
|
||||||
strategy:
|
strategy:
|
||||||
type: RollingUpdate
|
type: RollingUpdate
|
||||||
template:
|
template:
|
||||||
@@ -34,7 +34,7 @@ spec:
|
|||||||
mountPath: /templates/subscription
|
mountPath: /templates/subscription
|
||||||
containers:
|
containers:
|
||||||
- name: pasarguard-web
|
- name: pasarguard-web
|
||||||
image: pasarguard/panel:v5.0.3
|
image: pasarguard/panel:v5.0.1
|
||||||
imagePullPolicy: Always
|
imagePullPolicy: Always
|
||||||
envFrom:
|
envFrom:
|
||||||
- secretRef:
|
- secretRef:
|
||||||
@@ -50,10 +50,6 @@ spec:
|
|||||||
value: "/app/tls/tls.crt"
|
value: "/app/tls/tls.crt"
|
||||||
- name: UVICORN_SSL_KEYFILE
|
- name: UVICORN_SSL_KEYFILE
|
||||||
value: "/app/tls/tls.key"
|
value: "/app/tls/tls.key"
|
||||||
- name: UVICORN_PROXY_HEADERS
|
|
||||||
value: "true"
|
|
||||||
- name: FORWARDED_ALLOW_IPS
|
|
||||||
value: "*"
|
|
||||||
- name: CUSTOM_TEMPLATES_DIRECTORY
|
- name: CUSTOM_TEMPLATES_DIRECTORY
|
||||||
value: "/code/app/templates/"
|
value: "/code/app/templates/"
|
||||||
- name: SUBSCRIPTION_PAGE_TEMPLATE
|
- name: SUBSCRIPTION_PAGE_TEMPLATE
|
||||||
|
|||||||
@@ -7,7 +7,7 @@ kind: Kustomization
|
|||||||
helmCharts:
|
helmCharts:
|
||||||
- name: longhorn
|
- name: longhorn
|
||||||
repo: https://charts.longhorn.io
|
repo: https://charts.longhorn.io
|
||||||
version: 1.12.0
|
version: 1.11.2
|
||||||
releaseName: longhorn
|
releaseName: longhorn
|
||||||
namespace: longhorn
|
namespace: longhorn
|
||||||
valuesFile: values.yaml
|
valuesFile: values.yaml
|
||||||
|
|||||||
@@ -1,54 +1,7 @@
|
|||||||
global:
|
|
||||||
tolerations:
|
|
||||||
- key: "workload"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoSchedule"
|
|
||||||
- key: "node.kubernetes.io/unreachable"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoSchedule"
|
|
||||||
- key: "node.kubernetes.io/unreachable"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoExecute"
|
|
||||||
|
|
||||||
longhornManager:
|
|
||||||
tolerations:
|
|
||||||
- key: "workload"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoSchedule"
|
|
||||||
- key: "node.kubernetes.io/unreachable"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoSchedule"
|
|
||||||
- key: "node.kubernetes.io/unreachable"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoExecute"
|
|
||||||
|
|
||||||
longhornDriver:
|
|
||||||
tolerations:
|
|
||||||
- key: "workload"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoSchedule"
|
|
||||||
- key: "node.kubernetes.io/unreachable"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoSchedule"
|
|
||||||
- key: "node.kubernetes.io/unreachable"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoExecute"
|
|
||||||
|
|
||||||
longhornUI:
|
longhornUI:
|
||||||
replicas: 1
|
replicas: 1
|
||||||
tolerations:
|
|
||||||
- key: "workload"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoSchedule"
|
|
||||||
- key: "node.kubernetes.io/unreachable"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoSchedule"
|
|
||||||
- key: "node.kubernetes.io/unreachable"
|
|
||||||
operator: "Exists"
|
|
||||||
effect: "NoExecute"
|
|
||||||
|
|
||||||
defaultSettings:
|
defaultSettings:
|
||||||
taintToleration: "workload=ai:NoSchedule; workload=desktop:NoSchedule; node.kubernetes.io/unreachable:NoSchedule; node.kubernetes.io/unreachable:NoExecute"
|
|
||||||
# Keep new instance-manager pods schedulable on nodes with high CPU requests.
|
# Keep new instance-manager pods schedulable on nodes with high CPU requests.
|
||||||
guaranteedInstanceManagerCPU: '{"v1":"6","v2":"6"}'
|
guaranteedInstanceManagerCPU: '{"v1":"6","v2":"6"}'
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user