Cleanup: Remove redundant llama-slm service and use LXC IP
This commit is contained in:
parent
4ea94f7d60
commit
cb01b42f38
@ -10,19 +10,3 @@ services:
|
|||||||
- MAIN_PC_URL=http://10.0.4.11:8080/v1
|
- MAIN_PC_URL=http://10.0.4.11:8080/v1
|
||||||
- LOCAL_SLM_URL=http://10.0.4.200:8080/v1
|
- LOCAL_SLM_URL=http://10.0.4.200:8080/v1
|
||||||
- OPENAI_API_KEY=${OPENAI_API_KEY}
|
- OPENAI_API_KEY=${OPENAI_API_KEY}
|
||||||
depends_on:
|
|
||||||
- llama-slm
|
|
||||||
|
|
||||||
# The Local SLM (Fallback Brain)
|
|
||||||
llama-slm:
|
|
||||||
image: ghcr.io/ggerganov/llama.cpp:server
|
|
||||||
volumes:
|
|
||||||
- ./models:/models
|
|
||||||
# Command to run a small, fast model (e.g., Llama-3-8B GGUF)
|
|
||||||
command: >
|
|
||||||
-m /models/llama-3-8b-instruct.Q4_K_M.gguf
|
|
||||||
--host 0.0.0.0
|
|
||||||
--port 8080
|
|
||||||
--ctx-size 2048
|
|
||||||
ports:
|
|
||||||
- "8081:8080"
|
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user