File tree Expand file tree Collapse file tree 5 files changed +99
-4
lines changed Expand file tree Collapse file tree 5 files changed +99
-4
lines changed Original file line number Diff line number Diff line change @@ -14889,6 +14889,24 @@ Chen, Tianqi
1488914889
1489014890```
1489114891
14892+ ## Mooncake
14893+
14894+ - **Repository URL**: https://github.com/kvcache-ai/Mooncake
14895+ - **License URL**: https://github.com/kvcache-ai/Mooncake/blob/main/LICENSE-APACHE
14896+ - **License name**: Apache 2.0
14897+
14898+ ### Authors
14899+
14900+ © Copyright 2025, Mooncake Team.
14901+ Copyright (c) Meta Platforms, Inc. and affiliates.
14902+ Copyright 2024 KVCache.AI
14903+ Ruoyu Qin
14904+ Zheming Li
14905+ Weiran He
14906+ Mingxing Zhang
14907+ Yongwei Wu
14908+ Weimin Zheng
14909+ Xinran Xu
1489214910## flashinfer
1489314911
1489414912### License Text
Original file line number Diff line number Diff line change @@ -14697,6 +14697,24 @@ Chen, Tianqi
1469714697
1469814698```
1469914699
14700+ ## Mooncake
14701+
14702+ - **Repository URL**: https://github.com/kvcache-ai/Mooncake
14703+ - **License URL**: https://github.com/kvcache-ai/Mooncake/blob/main/LICENSE-APACHE
14704+ - **License name**: Apache 2.0
14705+
14706+ ### Authors
14707+
14708+ © Copyright 2025, Mooncake Team.
14709+ Copyright (c) Meta Platforms, Inc. and affiliates.
14710+ Copyright 2024 KVCache.AI
14711+ Ruoyu Qin
14712+ Zheming Li
14713+ Weiran He
14714+ Mingxing Zhang
14715+ Yongwei Wu
14716+ Weimin Zheng
14717+ Xinran Xu
1470014718## flashinfer
1470114719
1470214720### License Text
Original file line number Diff line number Diff line change @@ -44,6 +44,7 @@ COPY docker/common/install.sh \
4444 docker/common/install_ucx.sh \
4545 docker/common/install_nixl.sh \
4646 docker/common/install_etcd.sh \
47+ docker/common/install_mooncake.sh \
4748 ./
4849
4950RUN GITHUB_MIRROR=${GITHUB_MIRROR} \
@@ -103,6 +104,13 @@ COPY docker/common/install_triton.sh \
103104
104105RUN GITHUB_MIRROR=${GITHUB_MIRROR} bash ./install_triton.sh && rm install_triton.sh
105106
# Install Mooncake. This step runs after the Triton install because
# install_mooncake.sh deliberately omits libboost-all-dev and relies on the
# Boost that the Triton step already provides.
# RedHat-family images (detected via /etc/redhat-release) are skipped; the
# installer script is removed in either case so it does not stay in the image.
RUN if [ ! -f /etc/redhat-release ]; then \
        bash ./install_mooncake.sh; \
    else \
        echo "Rocky8 detected, skipping mooncake installation"; \
    fi \
    && rm install_mooncake.sh
113+
106114FROM ${DEVEL_IMAGE} AS wheel
107115WORKDIR /src/tensorrt_llm
108116COPY benchmarks benchmarks
Original file line number Diff line number Diff line change 1+ #! /bin/bash
# Build and install Mooncake (and its yalantinglibs dependency) from source.
#
# Side effects:
#   - installs the apt build dependencies listed below;
#   - installs yalantinglibs to CMake's default prefix;
#   - installs Mooncake under ${MOONCAKE_INSTALL_PATH};
#   - stores source tarballs of both projects in /third-party-source;
#   - appends an LD_LIBRARY_PATH export to the file named by ${ENV}.
#
# Must run as root, with network access, on a Debian/Ubuntu base image.
set -ex

# Pinned Mooncake release; the values must not contain whitespace because they
# are used verbatim as a git ref, a URL and a filesystem path.
MOONCAKE_VERSION="v0.3.6.post1"
MOONCAKE_REPO="https://github.com/kvcache-ai/Mooncake.git"
MOONCAKE_INSTALL_PATH="/usr/local/Mooncake"

# Fail early with a clear message instead of an obscure redirect error at the
# very end of a long build.
# NOTE(review): ENV is presumably exported by the Dockerfile as the shell
# environment file -- confirm against the image definition.
: "${ENV:?ENV must name the shell environment file to append to}"

apt-get update

# https://kvcache-ai.github.io/Mooncake/getting_started/build.html
# libboost-all-dev is removed because it will install a duplicated MPI library
# triton also installed boost so the requirement is already met
apt-get install -y --no-install-recommends \
    build-essential \
    libibverbs-dev \
    libgoogle-glog-dev \
    libgtest-dev \
    libjsoncpp-dev \
    libnuma-dev \
    libunwind-dev \
    libssl-dev \
    libyaml-cpp-dev \
    libcurl4-openssl-dev \
    libhiredis-dev \
    pkg-config \
    patchelf

# Drop the package index in the same layer so it does not bloat the image.
apt-get clean
rm -rf /var/lib/apt/lists/*

# Source archives of third-party code are kept alongside the binaries.
mkdir -p /third-party-source

# --- yalantinglibs (Mooncake build dependency) -------------------------------
# NOTE(review): this clone tracks the default branch and is not pinned to a
# tag or commit, so rebuilds are not reproducible -- consider pinning.
git clone --depth 1 https://github.com/alibaba/yalantinglibs.git
tar -czf /third-party-source/yalantinglibs.tar.gz yalantinglibs
cd yalantinglibs
mkdir build && cd build
cmake .. -DBUILD_EXAMPLES=OFF -DBUILD_BENCHMARK=OFF -DBUILD_UNIT_TESTS=OFF
# Bound parallelism to the CPU count; a bare `make -j` spawns unlimited jobs
# and can exhaust memory on large builders.
make -j"$(nproc)"
make install
cd ../..
rm -rf yalantinglibs

# --- Mooncake ----------------------------------------------------------------
git clone --depth 1 -b "${MOONCAKE_VERSION}" "${MOONCAKE_REPO}"
# Archive before fetching submodules and building, matching the original order.
tar -czf "/third-party-source/Mooncake-${MOONCAKE_VERSION}.tar.gz" Mooncake
cd Mooncake
git submodule update --init --recursive --depth 1
mkdir build && cd build
cmake .. -DUSE_CUDA=ON -DBUILD_SHARED_LIBS=ON -DCMAKE_INSTALL_PREFIX="${MOONCAKE_INSTALL_PATH}"
make -j"$(nproc)"
make install
cd ../..
rm -rf Mooncake

# Make the Mooncake shared libraries discoverable at runtime. The escaped
# \$LD_LIBRARY_PATH is written literally so it expands when ${ENV} is sourced,
# not while this script runs.
echo "export LD_LIBRARY_PATH=${MOONCAKE_INSTALL_PATH}/lib:\$LD_LIBRARY_PATH" >> "${ENV}"
Original file line number Diff line number Diff line change 1313# images are adopted from PostMerge pipelines, the abbreviated commit hash is used instead.
1414IMAGE_NAME =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm
1515
16- LLM_DOCKER_IMAGE =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.10-py3-x86_64-ubuntu24.04-trt10.13.3.9-skip-tritondevel-202511021230-8838
17- LLM_SBSA_DOCKER_IMAGE =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.10-py3-aarch64-ubuntu24.04-trt10.13.3.9-skip-tritondevel-202511021230-8838
18- LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-13.0.2-devel-rocky8-x86_64-rocky8-py310-trt10.13.3.9-skip-tritondevel-202511021230-8838
19- LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-13.0.2-devel-rocky8-x86_64-rocky8-py312-trt10.13.3.9-skip-tritondevel-202511021230-8838
16+ LLM_DOCKER_IMAGE =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.10-py3-x86_64-ubuntu24.04-trt10.13.3.9-skip-tritondevel-202511110140-8447
17+ LLM_SBSA_DOCKER_IMAGE =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:pytorch-25.10-py3-aarch64-ubuntu24.04-trt10.13.3.9-skip-tritondevel-202511110140-8447
18+ LLM_ROCKYLINUX8_PY310_DOCKER_IMAGE =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-13.0.2-devel-rocky8-x86_64-rocky8-py310-trt10.13.3.9-skip-tritondevel-202511110140-8447
19+ LLM_ROCKYLINUX8_PY312_DOCKER_IMAGE =urm.nvidia.com/sw-tensorrt-docker/tensorrt-llm:cuda-13.0.2-devel-rocky8-x86_64-rocky8-py312-trt10.13.3.9-skip-tritondevel-202511110140-8447
You can’t perform that action at this time.
0 commit comments