From 116d04665d6fa5d4c983b5af4497e3733562d8ca Mon Sep 17 00:00:00 2001 From: Harald Hoyer Date: Fri, 22 May 2026 07:08:26 +0200 Subject: [PATCH] fix(sgx): move LiteLLM off port 4000 to avoid uptime-kuma clash Uptime Kuma already binds 4000, so the gateway never got the port and requests hit the wrong service. Move LiteLLM to 4001 and update the rag CLI default endpoint to match. --- packages/rag/default.nix | 2 +- systems/x86_64-linux/sgx/litellm.nix | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/packages/rag/default.nix b/packages/rag/default.nix index 242b7dc..423c53a 100644 --- a/packages/rag/default.nix +++ b/packages/rag/default.nix @@ -22,7 +22,7 @@ writers.writePython3Bin "rag" from qdrant_client import QdrantClient from qdrant_client.models import Distance, PointStruct, VectorParams - API_BASE = os.environ.get("RAG_API_BASE", "http://localhost:4000/v1") + API_BASE = os.environ.get("RAG_API_BASE", "http://localhost:4001/v1") API_KEY = os.environ.get("RAG_API_KEY", "none") QDRANT_URL = os.environ.get("RAG_QDRANT_URL", "http://localhost:6333") EMBED_MODEL = os.environ.get("RAG_EMBED_MODEL", "bge-m3") diff --git a/systems/x86_64-linux/sgx/litellm.nix b/systems/x86_64-linux/sgx/litellm.nix index e22412e..29b03d8 100644 --- a/systems/x86_64-linux/sgx/litellm.nix +++ b/systems/x86_64-linux/sgx/litellm.nix @@ -6,7 +6,7 @@ services.litellm = { enable = true; host = "0.0.0.0"; - port = 4000; # 8080 is Open WebUI, 8081 is searx + port = 4001; # 8080 Open WebUI, 8081 searx, 4000 uptime-kuma openFirewall = true; # reachable across the LAN environmentFile = config.sops.secrets."litellm/env".path;