Add llamacpp container
Esse commit está contido em:
32
Services/llamacpp.container
Arquivo normal
32
Services/llamacpp.container
Arquivo normal
@@ -0,0 +1,32 @@
|
||||
# Quadlet container definition for the llama.cpp server.
[Container]
ContainerName=llamacpp
Image=localhost/llamacpp:vulkan-amd64
# Auto-update is left disabled: the image is pulled from localhost/, so it is
# presumably a local build with no registry to update from.
#AutoUpdate=registry
Network=internal.network
# host:container - the container side matches LLAMA_ARG_PORT below.
PublishPort=8090:8090

# Production - models come from the Hugging Face Hub; this volume keeps the
# llama.cpp cache directory on the host.
Volume=/srv/containers/aitools/models:/root/.cache/llama.cpp

# GPU access: pass the DRI render node through to the Vulkan image.
AddDevice=/dev/dri/renderD128
PodmanArgs=--group-add=keep-groups --ipc=host
SecurityLabelType=container_runtime_t

# llama.cpp server options, supplied as LLAMA_ARG_* environment variables.
Environment=LLAMA_ARG_HOST=0.0.0.0
Environment=LLAMA_ARG_PORT=8090
Environment=LLAMA_ARG_NO_MMAP=true
Environment=LLAMA_ARG_CTX_SIZE=131072
Environment=LLAMA_ARG_HF_REPO=unsloth/Qwen3-Coder-30B-A3B-Instruct-GGUF:Q2_K

# Hugging Face
# NOTE(review): HF_HOME is not under the Volume= mount above, so whatever is
# written there is presumably not persisted on the host - confirm this is
# intended.
Environment=HF_HOME=/root/.cache/huggingface
# The access token must never be stored in this file. It is injected as the
# HF_TOKEN environment variable from a Podman secret, created once with:
#   printf '%s' "<token>" | podman secret create hf_token -
# The token that was previously hard-coded here has been committed to the
# repository and must be revoked and replaced.
Secret=hf_token,type=env,target=HF_TOKEN
|
||||
|
||||
|
||||
# systemd service behaviour for the generated unit.
[Service]
# Allow up to 15 minutes for start-up (presumably to cover image preparation
# and the initial model download - confirm).
TimeoutStartSec=15m
# Restart the container only when it exits with a failure.
Restart=on-failure
|
||||
|
||||
# Targets that pull this unit in at start-up, one per line.
[Install]
WantedBy=multi-user.target
WantedBy=default.target
|
||||
Referência em uma Nova Issue
Bloquear um usuário