mirror of
https://github.com/NVIDIA/dgx-spark-playbooks.git
synced 2026-04-23 02:23:53 +00:00
chore: Regenerate all playbooks
This commit is contained in:
parent
911ca6db8b
commit
9414a5141f
@@ -27,8 +27,8 @@ services:
|
||||
# Ollama configuration
|
||||
- OLLAMA_BASE_URL=http://ollama:11434/v1
|
||||
- OLLAMA_MODEL=llama3.1:8b
|
||||
# Disable vLLM
|
||||
- VLLM_BASE_URL=http://localhost:8001/v1
|
||||
# vLLM disabled in default Ollama mode
|
||||
# - VLLM_BASE_URL=http://localhost:8001/v1
|
||||
- VLLM_MODEL=disabled
|
||||
# Vector DB configuration
|
||||
- QDRANT_URL=http://qdrant:6333
|
||||
|
||||
@@ -108,7 +108,7 @@ export class TextProcessor {
|
||||
|
||||
// Determine which LLM provider to use based on configuration
|
||||
// Priority: vLLM > NVIDIA > Ollama
|
||||
if (process.env.VLLM_BASE_URL) {
|
||||
if (process.env.VLLM_BASE_URL && process.env.VLLM_MODEL && process.env.VLLM_MODEL !== 'disabled') {
|
||||
this.selectedLLMProvider = 'vllm';
|
||||
} else if (process.env.NVIDIA_API_KEY) {
|
||||
this.selectedLLMProvider = 'nvidia';
|
||||
|
||||
Loading…
Reference in New Issue
Block a user