---
# ConfigMap "llamacpp-config": string key/value settings grouped under `data`.
# NOTE(review): the LLAMA_* names look like llama.cpp server environment
# variables, presumably injected into a container via envFrom/configMapKeyRef;
# confirm against the workload that references this ConfigMap.
apiVersion: v1
kind: ConfigMap
metadata:
  name: llamacpp-config
data:
  # ConfigMap `data` values must be strings, so numeric-looking values are
  # quoted to stop the YAML parser from typing them as integers.
  LLAMA_CACHE: /models
  LLAMA_ARG_HOST: 0.0.0.0
  LLAMA_ARG_PORT: "8080"
  # The ':' here is not followed by a space, so the plain scalar stays a
  # single string value.
  LLAMA_ARG_HF_REPO: unsloth/Qwen3.6-35B-A3B-MTP-GGUF:UD-Q6_K
  LLAMA_ARG_CTX_SIZE: "32768"
  LLAMA_ARG_FLASH_ATTN: auto
  # Quoted on purpose: a bare `on` is read as boolean true by YAML 1.1 parsers.
  LLAMA_ARG_FIT: "on"