Cleanup: Remove redundant llama-slm service and use LXC IP

This commit is contained in:
Tudorel Oprisan 2026-06-09 12:41:32 +01:00
parent 4ea94f7d60
commit cb01b42f38

View File

@@ -10,19 +10,3 @@ services:
- MAIN_PC_URL=http://10.0.4.11:8080/v1 - MAIN_PC_URL=http://10.0.4.11:8080/v1
- LOCAL_SLM_URL=http://10.0.4.200:8080/v1 - LOCAL_SLM_URL=http://10.0.4.200:8080/v1
- OPENAI_API_KEY=${OPENAI_API_KEY} - OPENAI_API_KEY=${OPENAI_API_KEY}
depends_on:
- llama-slm
# Local SLM (the "fallback brain"), run from the llama.cpp server image.
llama-slm:
  image: ghcr.io/ggerganov/llama.cpp:server
  # Host port 8081 is published to the container's port 8080.
  ports:
    - "8081:8080"
  # Bind-mounts ./models at /models, the directory the -m path below points to.
  volumes:
    - ./models:/models
  # Arguments for a small, fast model (e.g., Llama-3-8B GGUF). The folded
  # scalar (>) joins the lines below into one space-separated string.
  command: >
    -m /models/llama-3-8b-instruct.Q4_K_M.gguf
    --host 0.0.0.0
    --port 8080
    --ctx-size 2048