@@ -312,6 +312,28 @@ export RESULT_FILENAME="${RESULT_FILENAME:-}"
312312export SPEC_DECODING=" ${SPEC_DECODING:- } "
313313export IS_MULTINODE=" ${IS_MULTINODE:- false} "
314314
315+ # Agentic / custom vLLM-disagg connector knobs (threaded from submit.sh)
316+ export IS_AGENTIC=" ${IS_AGENTIC:- 0} "
317+ export DURATION=" ${DURATION:- 1800} "
318+ export MODEL=" ${MODEL:- } "
319+ export ROUTER_TYPE=" ${ROUTER_TYPE:- vllm-router} "
320+ export ROUTER_PORT=" ${ROUTER_PORT:- 30000} "
321+ export ENABLE_PREFIX_CACHING=" ${ENABLE_PREFIX_CACHING:- } "
322+ export MAX_MODEL_LEN=" ${MAX_MODEL_LEN:- } "
323+ export WEKA_LOADER_OVERRIDE=" ${WEKA_LOADER_OVERRIDE:- } "
324+ export VLLM_BIND_IP=" ${VLLM_BIND_IP:- } "
325+ export PREFILL_KV_CONNECTOR=" ${PREFILL_KV_CONNECTOR:- moriio} "
326+ export DECODE_KV_CONNECTOR=" ${DECODE_KV_CONNECTOR:- moriio} "
327+ export MC_PROTOCOL=" ${MC_PROTOCOL:- tcp} "
328+ export LMCACHE_HOST=" ${LMCACHE_HOST:- 127.0.0.1} "
329+ export LMCACHE_PORT=" ${LMCACHE_PORT:- 5555} "
330+ export LMCACHE_HTTP_PORT=" ${LMCACHE_HTTP_PORT:- 8080} "
331+ export LMCACHE_L1_SIZE_GB=" ${LMCACHE_L1_SIZE_GB:- 2500} "
332+ export LMCACHE_L1_INIT_SIZE_GB=" ${LMCACHE_L1_INIT_SIZE_GB:- 20} "
333+ export LMCACHE_L1_READ_TTL_SECONDS=" ${LMCACHE_L1_READ_TTL_SECONDS:- 3600} "
334+ export LMCACHE_CHUNK_SIZE=" ${LMCACHE_CHUNK_SIZE:- 256} "
335+ export LMCACHE_MAX_WORKERS=" ${LMCACHE_MAX_WORKERS:- 8} "
336+
315337SANITIZED_USER=$( echo " $USER_NAME " | tr -c ' a-zA-Z0-9_.-' ' _' )
316338export DOCKER_CONT_NAME=" container_${ENGINE} _${SANITIZED_USER} _${MODEL_NAME} _${SLURM_JOB_ID} "
317339
@@ -385,6 +407,26 @@ DOCKER_ENV_COMMON=(
385407 -e DECODE_ENABLE_DP=\$ DECODE_ENABLE_DP
386408 -e DECODE_MTP_SIZE=\$ DECODE_MTP_SIZE
387409 -e IS_MULTINODE=\$ IS_MULTINODE
410+ -e IS_AGENTIC=\$ IS_AGENTIC
411+ -e DURATION=\$ DURATION
412+ -e MODEL=\$ MODEL
413+ -e ROUTER_TYPE=\$ ROUTER_TYPE
414+ -e ROUTER_PORT=\$ ROUTER_PORT
415+ -e ENABLE_PREFIX_CACHING=\$ ENABLE_PREFIX_CACHING
416+ -e MAX_MODEL_LEN=\$ MAX_MODEL_LEN
417+ -e WEKA_LOADER_OVERRIDE=\$ WEKA_LOADER_OVERRIDE
418+ -e VLLM_BIND_IP=\$ VLLM_BIND_IP
419+ -e PREFILL_KV_CONNECTOR=\$ PREFILL_KV_CONNECTOR
420+ -e DECODE_KV_CONNECTOR=\$ DECODE_KV_CONNECTOR
421+ -e MC_PROTOCOL=\$ MC_PROTOCOL
422+ -e LMCACHE_HOST=\$ LMCACHE_HOST
423+ -e LMCACHE_PORT=\$ LMCACHE_PORT
424+ -e LMCACHE_HTTP_PORT=\$ LMCACHE_HTTP_PORT
425+ -e LMCACHE_L1_SIZE_GB=\$ LMCACHE_L1_SIZE_GB
426+ -e LMCACHE_L1_INIT_SIZE_GB=\$ LMCACHE_L1_INIT_SIZE_GB
427+ -e LMCACHE_L1_READ_TTL_SECONDS=\$ LMCACHE_L1_READ_TTL_SECONDS
428+ -e LMCACHE_CHUNK_SIZE=\$ LMCACHE_CHUNK_SIZE
429+ -e LMCACHE_MAX_WORKERS=\$ LMCACHE_MAX_WORKERS
388430)
389431
390432# Engine-specific env vars
0 commit comments