Skip to content

Commit 463dc37

Browse files
committed
Updated default config for agentic rag in rag server
1 parent d54e757 commit 463dc37

1 file changed

Lines changed: 4 additions & 4 deletions

File tree

deploy/compose/docker-compose-rag-server.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -67,7 +67,7 @@ services:
6767
COLLECTION_NAME: ${COLLECTION_NAME:-multimodal_data}
6868
APP_RETRIEVER_SCORETHRESHOLD: 0.25
6969
# Top K results fetched from the vector DB; passed to the reranker model if enabled, otherwise directly into the LLM prompt
70-
VECTOR_DB_TOPK: ${VECTOR_DB_TOPK:-100}
70+
VECTOR_DB_TOPK: ${VECTOR_DB_TOPK:-50}
7171

7272
##===LLM Model specific configurations===
7373
APP_LLM_MODELNAME: ${APP_LLM_MODELNAME:-"nvidia/nemotron-3-super-120b-a12b"}
@@ -90,7 +90,7 @@ services:
9090
AGENTIC_TASK_LLM_ENABLE_THINKING: ${AGENTIC_TASK_LLM_ENABLE_THINKING:-true}
9191
AGENTIC_TASK_LLM_REASONING_BUDGET: ${AGENTIC_TASK_LLM_REASONING_BUDGET:-0}
9292
AGENTIC_TASK_LLM_LOW_EFFORT: ${AGENTIC_TASK_LLM_LOW_EFFORT:-false}
93-
AGENTIC_SEED_GEN_LLM_ENABLE_THINKING: ${AGENTIC_SEED_GEN_LLM_ENABLE_THINKING:-true}
93+
AGENTIC_SEED_GEN_LLM_ENABLE_THINKING: ${AGENTIC_SEED_GEN_LLM_ENABLE_THINKING:-false}
9494
AGENTIC_SEED_GEN_LLM_REASONING_BUDGET: ${AGENTIC_SEED_GEN_LLM_REASONING_BUDGET:-0}
9595
AGENTIC_SEED_GEN_LLM_LOW_EFFORT: ${AGENTIC_SEED_GEN_LLM_LOW_EFFORT:-false}
9696
AGENTIC_SYNTHESIS_LLM_ENABLE_THINKING: ${AGENTIC_SYNTHESIS_LLM_ENABLE_THINKING:-true}
@@ -176,8 +176,8 @@ services:
176176
# Agentic RAG task-execute stage retrieval. Each value resolves in order: its own
177177
# APP_AGENTIC_TASK_* host variable if set and non-empty, else the host's
178178
# VECTOR_DB_TOPK / APP_RETRIEVER_TOPK, else the literal default, so it is never an empty string (which would fail int parsing).
179-
APP_AGENTIC_TASK_VECTOR_DB_TOPK: ${APP_AGENTIC_TASK_VECTOR_DB_TOPK:-${VECTOR_DB_TOPK:-100}}
180-
APP_AGENTIC_TASK_RETRIEVER_TOPK: ${APP_AGENTIC_TASK_RETRIEVER_TOPK:-${APP_RETRIEVER_TOPK:-10}}
179+
APP_AGENTIC_TASK_VECTOR_DB_TOPK: ${APP_AGENTIC_TASK_VECTOR_DB_TOPK:-${VECTOR_DB_TOPK:-20}}
180+
APP_AGENTIC_TASK_RETRIEVER_TOPK: ${APP_AGENTIC_TASK_RETRIEVER_TOPK:-${APP_RETRIEVER_TOPK:-5}}
181181

182182
# Log level for the server. Supported levels: NOTSET, DEBUG, INFO, WARN, ERROR, CRITICAL
183183
LOGLEVEL: ${LOGLEVEL:-INFO}

0 commit comments

Comments
 (0)