rag: resilient embedder — rotate/split on endpoint errors; 4-GPU embed pool (#8)
This commit was merged in pull request #8.
This commit is contained in:
@@ -22,7 +22,7 @@ env:
|
||||
# Two GPU-pinned Ollama containers on the Gitea host — same infra
|
||||
# zerto-docs uses. :11435 = Titan X, :11436 = 1080 Ti. Indexer
|
||||
# round-robins per batch across every endpoint listed in OLLAMA_URLS.
|
||||
OLLAMA_URLS: http://192.168.0.2:11435,http://192.168.0.2:11436
|
||||
OLLAMA_URLS: http://192.168.0.2:11435,http://192.168.0.2:11436,http://192.168.0.125:11434,http://192.168.0.126:11434
|
||||
EMBED_MODEL: nomic-embed-text
|
||||
PRODUCT_NAME: hvm
|
||||
|
||||
|
||||
@@ -34,7 +34,7 @@ env:
|
||||
# :11435 owns the Titan X, :11436 owns the 1080 Ti; the indexer
|
||||
# round-robins per batch so all cards run in parallel. The host's
|
||||
# primary Ollama on :11434 is left alone for OpenWebUI etc.
|
||||
OLLAMA_URLS: http://192.168.0.2:11435,http://192.168.0.2:11436
|
||||
OLLAMA_URLS: http://192.168.0.2:11435,http://192.168.0.2:11436,http://192.168.0.125:11434,http://192.168.0.126:11434
|
||||
EMBED_MODEL: nomic-embed-text
|
||||
|
||||
PRODUCT_NAME: hvm
|
||||
|
||||
Reference in New Issue
Block a user