---
# Service exposing the llamacpp-cuda pods on port 8080.
apiVersion: v1
kind: Service
metadata:
  name: llamacpp-cuda
  labels:
    app: llamacpp-cuda
spec:
  # ClusterIP gives the Service a cluster-internal virtual IP; nothing in this
  # manifest exposes it outside the cluster.
  type: ClusterIP
  # Traffic is routed to pods carrying the label app=llamacpp-cuda.
  selector:
    app: llamacpp-cuda
  ports:
    - name: http
      port: 8080
      # A string targetPort is looked up by name among the container ports of
      # the selected pods.
      # NOTE(review): confirm the workload declares a container port named
      # "http"; otherwise this Service has no reachable backend port.
      targetPort: http
      protocol: TCP