# Podman Quadlet container unit: runs a llama.cpp server in the "llamacpp" container.
[Container]
ContainerName=llamacpp
Image=localhost/llamacpp:vulkan-amd64
# Auto-update is currently disabled.
# NOTE(review): the image is a localhost/ build, so the "registry" policy has
# no remote to compare against; "local" is the policy intended for locally
# built images - confirm before re-enabling.
#AutoUpdate=registry
Network=internal.network
# host port 8090 -> container port 8090 (must match LLAMA_ARG_PORT below)
PublishPort=8090:8090

# Production: keep downloaded models on the host so they outlive the container.
# NOTE(review): the original note said "Lemonade uses the Hugging Face Hub for
# the models", but this unit runs llama.cpp - confirm the note still applies.
Volume=/srv/containers/aitools/models:/root/.cache/llama.cpp

# GPU access: expose the DRM render node to the container.
# NOTE(review): this group was labelled "ROCm tuning", but the image tag is
# vulkan-amd64 and /dev/kfd is not passed through - confirm the intended backend.
AddDevice=/dev/dri/renderD128
PodmanArgs=--group-add=keep-groups --ipc=host
SecurityLabelType=container_runtime_t

# llama.cpp settings, passed as LLAMA_ARG_* environment variables.
# Listen on all interfaces inside the container so the published port is reachable.
Environment=LLAMA_ARG_HOST=0.0.0.0
Environment=LLAMA_ARG_PORT=8090
Environment=LLAMA_ARG_NO_MMAP=true
# context size in tokens
Environment=LLAMA_ARG_CTX_SIZE=131072
# <repo>:<quant> to fetch from the Hugging Face Hub
Environment=LLAMA_ARG_HF_REPO=unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF:Q2_K

# Hugging Face
# NOTE(review): this path is not covered by the Volume= above, so anything
# written there is lost when the container is recreated - confirm it is needed.
Environment=HF_HOME=/root/.cache/huggingface
# The access token must not be stored in this unit file. It is injected as the
# HF_TOKEN environment variable from a Podman secret named "hf_token".
# Create the secret once, as the user that runs this unit:
#   printf '%s' "<token>" | podman secret create hf_token -
# SECURITY: a token was previously hard-coded here in plain text; revoke it on
# huggingface.co and issue a new one.
Secret=hf_token,type=env,target=HF_TOKEN

[Service]
# Restart the container only when it exits with an error.
Restart=on-failure
# Allow up to 15 minutes for start-up.
# NOTE(review): presumably sized to cover a first-time model download - confirm.
TimeoutStartSec=15m

[Install]
# Start at boot: listed for both multi-user.target and default.target.
WantedBy=multi-user.target default.target