fix(sgx): move LiteLLM off port 4000 to avoid uptime-kuma clash

Uptime Kuma already binds port 4000, so the LiteLLM gateway never got the
port and requests to it hit the wrong service. Move LiteLLM to port 4001 and
update the rag CLI's default endpoint to match.
This commit is contained in:
Harald Hoyer 2026-05-22 07:08:26 +02:00
parent 95668b71a7
commit 116d04665d
2 changed files with 2 additions and 2 deletions

View file

@ -22,7 +22,7 @@ writers.writePython3Bin "rag"
from qdrant_client import QdrantClient from qdrant_client import QdrantClient
from qdrant_client.models import Distance, PointStruct, VectorParams from qdrant_client.models import Distance, PointStruct, VectorParams
API_BASE = os.environ.get("RAG_API_BASE", "http://localhost:4000/v1") API_BASE = os.environ.get("RAG_API_BASE", "http://localhost:4001/v1")
API_KEY = os.environ.get("RAG_API_KEY", "none") API_KEY = os.environ.get("RAG_API_KEY", "none")
QDRANT_URL = os.environ.get("RAG_QDRANT_URL", "http://localhost:6333") QDRANT_URL = os.environ.get("RAG_QDRANT_URL", "http://localhost:6333")
EMBED_MODEL = os.environ.get("RAG_EMBED_MODEL", "bge-m3") EMBED_MODEL = os.environ.get("RAG_EMBED_MODEL", "bge-m3")

View file

@ -6,7 +6,7 @@
services.litellm = { services.litellm = {
enable = true; enable = true;
host = "0.0.0.0"; host = "0.0.0.0";
port = 4000; # 8080 is Open WebUI, 8081 is searx port = 4001; # 8080 Open WebUI, 8081 searx, 4000 uptime-kuma
openFirewall = true; # reachable across the LAN openFirewall = true; # reachable across the LAN
environmentFile = config.sops.secrets."litellm/env".path; environmentFile = config.sops.secrets."litellm/env".path;