@@ -67,7 +67,7 @@ services:
6767 COLLECTION_NAME : ${COLLECTION_NAME:-multimodal_data}
6868 APP_RETRIEVER_SCORETHRESHOLD : 0.25
6969 # Top-K results fetched from the vector DB; passed to the reranker model if enabled, otherwise straight into the LLM prompt
70- VECTOR_DB_TOPK : ${VECTOR_DB_TOPK:-100 }
70+ VECTOR_DB_TOPK : ${VECTOR_DB_TOPK:-50 }
7171
7272 # #===LLM Model specific configurations===
7373 APP_LLM_MODELNAME : ${APP_LLM_MODELNAME:-"nvidia/nemotron-3-super-120b-a12b"}
@@ -90,7 +90,7 @@ services:
9090 AGENTIC_TASK_LLM_ENABLE_THINKING : ${AGENTIC_TASK_LLM_ENABLE_THINKING:-true}
9191 AGENTIC_TASK_LLM_REASONING_BUDGET : ${AGENTIC_TASK_LLM_REASONING_BUDGET:-0}
9292 AGENTIC_TASK_LLM_LOW_EFFORT : ${AGENTIC_TASK_LLM_LOW_EFFORT:-false}
93- AGENTIC_SEED_GEN_LLM_ENABLE_THINKING : ${AGENTIC_SEED_GEN_LLM_ENABLE_THINKING:-true }
93+ AGENTIC_SEED_GEN_LLM_ENABLE_THINKING : ${AGENTIC_SEED_GEN_LLM_ENABLE_THINKING:-false }
9494 AGENTIC_SEED_GEN_LLM_REASONING_BUDGET : ${AGENTIC_SEED_GEN_LLM_REASONING_BUDGET:-0}
9595 AGENTIC_SEED_GEN_LLM_LOW_EFFORT : ${AGENTIC_SEED_GEN_LLM_LOW_EFFORT:-false}
9696 AGENTIC_SYNTHESIS_LLM_ENABLE_THINKING : ${AGENTIC_SYNTHESIS_LLM_ENABLE_THINKING:-true}
@@ -176,8 +176,8 @@ services:
176176 # Agentic RAG task-execute stage retrieval. Nested-default form: each value uses the
177177 # agentic-specific host variable when set and non-empty, else the general VECTOR_DB_TOPK /
178178 # APP_RETRIEVER_TOPK, else the literal default, so it is never an empty string (which would fail int parsing).
179- APP_AGENTIC_TASK_VECTOR_DB_TOPK : ${APP_AGENTIC_TASK_VECTOR_DB_TOPK:-${VECTOR_DB_TOPK:-100 }}
180- APP_AGENTIC_TASK_RETRIEVER_TOPK : ${APP_AGENTIC_TASK_RETRIEVER_TOPK:-${APP_RETRIEVER_TOPK:-10 }}
179+ APP_AGENTIC_TASK_VECTOR_DB_TOPK : ${APP_AGENTIC_TASK_VECTOR_DB_TOPK:-${VECTOR_DB_TOPK:-20 }}
180+ APP_AGENTIC_TASK_RETRIEVER_TOPK : ${APP_AGENTIC_TASK_RETRIEVER_TOPK:-${APP_RETRIEVER_TOPK:-5 }}
181181
182182 # Log level for the server. Supported levels: NOTSET, DEBUG, INFO, WARN, ERROR, CRITICAL
183183 LOGLEVEL : ${LOGLEVEL:-INFO}
0 commit comments