1 file changed: +3 -3 lines changed
@@ -7,7 +7,7 @@ servingEngineSpec:
 # Prefill node configuration
 - name: "llama-prefill"
   repository: "lmcache/vllm-openai"
-  tag: "nightly-2025-08-20"
+  tag: "nightly-2025-09-04"
   modelURL: "meta-llama/Llama-3.1-8B-Instruct"
   replicaCount: 1
   requestCPU: 8
@@ -42,7 +42,7 @@ servingEngineSpec:
 # Decode node configuration
 - name: "llama-decode"
   repository: "lmcache/vllm-openai"
-  tag: "nightly-2025-08-20"
+  tag: "nightly-2025-09-04"
   modelURL: "meta-llama/Llama-3.1-8B-Instruct"
   replicaCount: 1
   requestCPU: 8
@@ -69,7 +69,7 @@ servingEngineSpec:
 nixlPeerAllocPort: 7400
 nixlBufferSize: "2147483648"
 nixlBufferDevice: "cuda"
-nixlBackends: ["UCX"]
+# nixlBackends: ["UCX"]
 enablePD: true
 rpcPort: "consumer1"
 skipLastNTokens: 1
You can’t perform that action at this time.
0 commit comments