feat(rag): install on m4 and amd, default endpoints to sgx
Add the rag CLI to the m4 and amd hosts and point its default API_BASE and QDRANT_URL at sgx (where the gateway and Qdrant run) instead of localhost. Because the services live on sgx, the localhost default only worked on that host. The hostname sgx resolves to the local machine when used on sgx itself, so the new default is correct on every host and leaves only RAG_API_KEY to be set.
This commit is contained in:
parent
fc3e40686a
commit
89c82cf804
3 changed files with 4 additions and 2 deletions
|
|
@@ -22,9 +22,9 @@ writers.writePython3Bin "rag"
|
|||
from qdrant_client import QdrantClient
|
||||
from qdrant_client.models import Distance, PointStruct, VectorParams
|
||||
|
||||
API_BASE = os.environ.get("RAG_API_BASE", "http://localhost:4001/v1")
|
||||
API_BASE = os.environ.get("RAG_API_BASE", "http://sgx:4001/v1")
|
||||
API_KEY = os.environ.get("RAG_API_KEY", "none")
|
||||
QDRANT_URL = os.environ.get("RAG_QDRANT_URL", "http://localhost:6333")
|
||||
QDRANT_URL = os.environ.get("RAG_QDRANT_URL", "http://sgx:6333")
|
||||
EMBED_MODEL = os.environ.get("RAG_EMBED_MODEL", "bge-m3")
|
||||
CHAT_MODEL = os.environ.get("RAG_CHAT_MODEL", "coder")
|
||||
DEFAULT_COLLECTION = os.environ.get("RAG_COLLECTION", "docs")
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue