We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 6917d5b, commit 7b7728c (Copy full SHA for 7b7728c)
ChatQnA/docker_compose/intel/cpu/xeon/compose.yaml
@@ -96,6 +96,7 @@ services:
96
HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
97
LLM_MODEL_ID: ${LLM_MODEL_ID}
98
VLLM_TORCH_PROFILER_DIR: "/mnt"
99
+ VLLM_CPU_KVCACHE_SPACE: 40
100
healthcheck:
101
test: ["CMD-SHELL", "curl -f http://$host_ip:9009/health || exit 1"]
102
interval: 10s
0 commit comments