llama-server helm

No introduction found. Create it?

Install

Install with:

helm install llama-server oci://ghcr.io/bjw-s-labs/charts/app-template -f values.yaml

Examples

See examples from other people.

Top Repositories (2 out of 3)

Name | Repo | Stars | Version | Timestamp
llama-server | joryirving/home-ops | 216 | 5.0.1 | 7 hours ago
llama-server | joryirving/home-ops | 216 | 5.0.1 | 7 hours ago

Values

See the most popular values for this chart:

Key | Types
number
number
string
string
string
string
string
controllers.llama-server.containers.app.args[] (2)
- --host
- "0.0.0.0"
- --port
- "8080"
- --alias
- self-hosted
- --model
- /models/gemma4-26b/gemma-4-26B-A4B-it-UD-Q5_K_XL.gguf
- --mmproj
- /models/gemma4-26b/mmproj-F16.gguf
- --ctx-size
- "262144"
- --n-gpu-layers
- "99"
- --flash-attn
- on
- --parallel
- "3"
- --cont-batching
- -sps
- "0.90"
- --no-context-shift
- --cache-prompt
- --kv-unified
- --ctx-checkpoints
- "4"
- --checkpoint-every-n-tokens
- "16384"
- --image-min-tokens
- "1120"
- --image-max-tokens
- "1120"
- --metrics
- --temp
- "0.4"
- --top-p
- "0.92"
- --top-k
- "40"
- --min-p
- "0"
- --batch-size
- "4096"
- --ubatch-size
- "2048"
- --threads
- "12"
- --threads-batch
- "16"
- --no-mmap
string
string
string
controllers.llama-server.containers.app.image.repository (2)
docker.io/kyuz0/amd-strix-halo-toolboxes
string
controllers.llama-server.containers.app.image.tag (2)
rocm-7.2.3@sha256:a07e7576a800a8f77cd6ae1a4522d6c7e005f49cf047470a5183a2e1a4031135
string
boolean
boolean
number
string
number
number
number
boolean
boolean
number
string
number
number
number
boolean
boolean
number
string
number
number
string
number, string
string
boolean
controllers.llama-server.initContainers.model-download.command[] (2)
- /bin/sh
- -ec
- |
  set -euo pipefail
  if [ ! -s /models/gemma4-26b/gemma-4-26B-A4B-it-UD-Q5_K_XL.gguf ] || [ ! -s /models/gemma4-26b/mmproj-F16.gguf ]; then
    pip install --no-cache-dir "huggingface_hub[hf_transfer]"
    mkdir -p /models/gemma4-26b
    rm -rf /models/gemma4-26b/.cache/huggingface/download/gemma-4-26B-A4B-UD-Q5_K_XL.gguf.lock
    hf download \
      unsloth/gemma-4-26B-A4B-it-GGUF \
      gemma-4-26B-A4B-it-UD-Q5_K_XL.gguf \
      mmproj-F16.gguf \
      --local-dir /models/gemma4-26b
    echo "Gemma-4-26B-A4B-Q5_K_XL download complete"
  else
    echo "Gemma-4-26B-A4B-Q5_K_XL already downloaded, skipping"
  fi
string
string
string
string
string
string
string
string
string
controllers.app.containers.app.args[] (1)
- --host
- "0.0.0.0"
- --port
- "8080"
- --models-preset
- /app/models.ini
- --models-max
- "1"
- --parallel
- "1"
- --metrics
- --slots
string
string
string
string
controllers.app.containers.app.image.tag (1)
server-cuda13@sha256:1b3694b9a8f68b95e4667c8b598c3e46b69dc2702ab227ebe2b2bd2282bb34d6
string
boolean
boolean
number
string
number
number
number
number
boolean
boolean
number
string
number
number
number
number
boolean
boolean
number
string
number
number
number
number
number
string
number
number
string
number
boolean
string
string
string
string
string
string
string
string
string
string
string
string
string
string
string
string
boolean
string
string
string
boolean
string
persistence.config.name (1)
llama-server-config
string
string
route.app.hostnames[] (1)
- {{ .Release.Name }}.${SECRET_DOMAIN}
string
string
string
string
number