Skip to content

Commit 0b9bc5a

Browse files
bo-nv and zhengd-nv authored
[None][infra] install mooncake in docker images (#8447)
Signed-off-by: Bo Deng <deemod@nvidia.com> Signed-off-by: zhengd-nv <200704041+zhengd-nv@users.noreply.github.com> Signed-off-by: Zheng Duan <200704041+zhengd-nv@users.noreply.github.com> Co-authored-by: zhengd-nv <200704041+zhengd-nv@users.noreply.github.com>
1 parent da1f0e2 commit 0b9bc5a

File tree

5 files changed

+99
-4
lines changed

5 files changed

+99
-4
lines changed

ATTRIBUTIONS-CPP-aarch64.md

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -14889,6 +14889,24 @@ Chen, Tianqi
1488914889

1489014890
```
1489114891

14892+
## Mooncake
14893+
14894+
- **Repository URL**: https://github.com/kvcache-ai/Mooncake
14895+
- **License URL**: https://github.com/kvcache-ai/Mooncake/blob/main/LICENSE-APACHE
14896+
- **License name**: Apache 2.0
14897+
14898+
### Authors
14899+
14900+
© Copyright 2025, Mooncake Team.
14901+
Copyright (c) Meta Platforms, Inc. and affiliates.
14902+
Copyright 2024 KVCache.AI
14903+
Ruoyu Qin
14904+
Zheming Li
14905+
Weiran He
14906+
Mingxing Zhang
14907+
Yongwei Wu
14908+
Weimin Zheng
14909+
Xinran Xu
1489214910
## flashinfer
1489314911

1489414912
### License Text

ATTRIBUTIONS-CPP-x86_64.md

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -14697,6 +14697,24 @@ Chen, Tianqi
1469714697

1469814698
```
1469914699

14700+
## Mooncake
14701+
14702+
- **Repository URL**: https://github.com/kvcache-ai/Mooncake
14703+
- **License URL**: https://github.com/kvcache-ai/Mooncake/blob/main/LICENSE-APACHE
14704+
- **License name**: Apache 2.0
14705+
14706+
### Authors
14707+
14708+
© Copyright 2025, Mooncake Team.
14709+
Copyright (c) Meta Platforms, Inc. and affiliates.
14710+
Copyright 2024 KVCache.AI
14711+
Ruoyu Qin
14712+
Zheming Li
14713+
Weiran He
14714+
Mingxing Zhang
14715+
Yongwei Wu
14716+
Weimin Zheng
14717+
Xinran Xu
1470014718
## flashinfer
1470114719

1470214720
### License Text

docker/Dockerfile.multi

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -44,6 +44,7 @@ COPY docker/common/install.sh \
4444
docker/common/install_ucx.sh \
4545
docker/common/install_nixl.sh \
4646
docker/common/install_etcd.sh \
47+
docker/common/install_mooncake.sh \
4748
./
4849

4950
RUN GITHUB_MIRROR=${GITHUB_MIRROR} \
@@ -103,6 +104,13 @@ COPY docker/common/install_triton.sh \
103104

104105
RUN GITHUB_MIRROR=${GITHUB_MIRROR} bash ./install_triton.sh && rm install_triton.sh
105106

107+
# Mooncake is built only after install_triton.sh has run, because that step
# takes care of the Boost requirement. Images that ship /etc/redhat-release
# (Rocky Linux 8) skip the build; the installer script is removed either way.
RUN if [ ! -f /etc/redhat-release ]; then \
        bash ./install_mooncake.sh; \
    else \
        echo "Rocky8 detected, skipping mooncake installation"; \
    fi && rm install_mooncake.sh
113+
106114
FROM ${DEVEL_IMAGE} AS wheel
107115
WORKDIR /src/tensorrt_llm
108116
COPY benchmarks benchmarks

docker/common/install_mooncake.sh

Lines changed: 51 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
1+
#!/bin/bash
# Builds and installs Mooncake and its yalantinglibs dependency from source on
# an apt-based image.
#
# Required environment:
#   ENV  Path of the shell init file that receives the LD_LIBRARY_PATH export.
#
# Side effects:
#   - Installs the build dependencies with apt-get.
#   - Stores a source tarball of each cloned project in /third-party-source.
#   - Installs yalantinglibs into the default CMake prefix and Mooncake into
#     MOONCAKE_INSTALL_PATH.
#   - Appends an LD_LIBRARY_PATH export for Mooncake's lib directory to ${ENV}.
set -euxo pipefail

readonly MOONCAKE_VERSION="v0.3.6.post1"
readonly MOONCAKE_REPO="https://github.com/kvcache-ai/Mooncake.git"
readonly MOONCAKE_INSTALL_PATH="/usr/local/Mooncake"
readonly YALANTINGLIBS_REPO="https://github.com/alibaba/yalantinglibs.git"
readonly THIRD_PARTY_SOURCE_DIR="/third-party-source"

# Check ENV before the long build: it is only written on the last line, so a
# missing value would otherwise surface after everything has been compiled.
: "${ENV:?ENV must be set to the shell init file that should be updated}"

# A bare `make -j` puts no limit on the number of parallel jobs, which can
# exhaust memory on a large C++ build; bound it to the available CPUs.
BUILD_JOBS="$(nproc)"
readonly BUILD_JOBS

apt-get update

# https://kvcache-ai.github.io/Mooncake/getting_started/build.html
# libboost-all-dev is removed because it will install a duplicated MPI library
# triton also installed boost so the requirement is already met
apt-get install -y --no-install-recommends \
    build-essential \
    libibverbs-dev \
    libgoogle-glog-dev \
    libgtest-dev \
    libjsoncpp-dev \
    libnuma-dev \
    libunwind-dev \
    libssl-dev \
    libyaml-cpp-dev \
    libcurl4-openssl-dev \
    libhiredis-dev \
    pkg-config \
    patchelf

mkdir -p "${THIRD_PARTY_SOURCE_DIR}"

# yalantinglibs: archive the checked-out source, then build and install it.
# NOTE(review): this clones the default branch without a tag or commit, so the
# build is not reproducible -- consider pinning a known-good revision.
git clone --depth 1 "${YALANTINGLIBS_REPO}"
tar -czf "${THIRD_PARTY_SOURCE_DIR}/yalantinglibs.tar.gz" yalantinglibs
cd yalantinglibs
mkdir build && cd build
cmake .. -DBUILD_EXAMPLES=OFF -DBUILD_BENCHMARK=OFF -DBUILD_UNIT_TESTS=OFF
make -j"${BUILD_JOBS}"
make install
cd ../..
rm -rf yalantinglibs

# Mooncake: archive the tagged source, fetch submodules, build and install.
# NOTE(review): the tarball is created before the submodules are fetched, so it
# does not contain their sources -- confirm this is intended.
git clone --depth 1 -b "${MOONCAKE_VERSION}" "${MOONCAKE_REPO}"
tar -czf "${THIRD_PARTY_SOURCE_DIR}/Mooncake-${MOONCAKE_VERSION}.tar.gz" Mooncake
cd Mooncake
git submodule update --init --recursive --depth 1
mkdir build && cd build
cmake .. -DUSE_CUDA=ON -DBUILD_SHARED_LIBS=ON "-DCMAKE_INSTALL_PREFIX=${MOONCAKE_INSTALL_PATH}"
make -j"${BUILD_JOBS}"
make install
cd ../..
rm -rf Mooncake

# \$LD_LIBRARY_PATH is escaped on purpose: it must be expanded when the init
# file is sourced, not while this script runs.
echo "export LD_LIBRARY_PATH=${MOONCAKE_INSTALL_PATH}/lib:\$LD_LIBRARY_PATH" >> "${ENV}"

jenkins/current_image_tags.properties

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
# images are adopted from PostMerge pipelines, the abbreviated commit hash is used instead.
1414
IMAGE_NAME=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm
1515

16-
LLM_DOCKER_IMAGE=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.10-py3-x86_64-ubuntu24.04-trt10.13.3.9-skip-tritondevel-202511021230-8838
17-
LLM_SBSA_DOCKER_IMAGE=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.10-py3-aarch64-ubuntu24.04-trt10.13.3.9-skip-tritondevel-202511021230-8838
18-
LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-13.0.2-devel-rocky8-x86_64-rocky8-py310-trt10.13.3.9-skip-tritondevel-202511021230-8838
19-
LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-13.0.2-devel-rocky8-x86_64-rocky8-py312-trt10.13.3.9-skip-tritondevel-202511021230-8838
16+
LLM_DOCKER_IMAGE=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.10-py3-x86_64-ubuntu24.04-trt10.13.3.9-skip-tritondevel-202511110140-8447
17+
LLM_SBSA_DOCKER_IMAGE=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.10-py3-aarch64-ubuntu24.04-trt10.13.3.9-skip-tritondevel-202511110140-8447
18+
LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-13.0.2-devel-rocky8-x86_64-rocky8-py310-trt10.13.3.9-skip-tritondevel-202511110140-8447
19+
LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE=urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-13.0.2-devel-rocky8-x86_64-rocky8-py312-trt10.13.3.9-skip-tritondevel-202511110140-8447

0 commit comments

Comments
 (0)