Skip to content

Commit 85f5edf

Browse files
committed
Merge branch 'main' into bump-version
2 parents 91211e8 + 28a5dbb commit 85f5edf

File tree

3 files changed

+1
-4
lines changed

3 files changed

+1
-4
lines changed

docker/Dockerfile

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -66,6 +66,5 @@ RUN --mount=type=cache,target=/root/.cache \
66 | 66 |   # explicitly set ptxas path for triton
67 | 67 |   ENV PATH=/opt/py3/bin:$PATH
68 | 68 |   ENV TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas
69 |    | - ENV NCCL_LAUNCH_MODE=GROUP
70 | 69 |   ENV LD_LIBRARY_PATH=/nccl/lib:$LD_LIBRARY_PATH
71 | 70 |   FROM ${IMAGE_TYPE}

docker/prepare_wheel.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@ if [[ "${CUDA_VERSION_SHORT}" != "cu118" ]]; then
26 | 26 |   DEEP_GEMM_VERSION=03d0be3
27 | 27 |   FLASH_MLA_VERSION=9edee0c
28 | 28 |   else
29 |    | - DEEP_GEMM_VERSION=1876566
   | 29 | + DEEP_GEMM_VERSION=79f48ee
30 | 30 |   FLASH_MLA_VERSION=c759027
31 | 31 |   fi
32 | 32 |

k8s/deployment.yaml

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -24,8 +24,6 @@ spec:
24 | 24 |   args:
25 | 25 |   - "lmdeploy serve api_server internlm/internlm2-chat-7b --server-port 23333"
26 | 26 |   env:
27 |    | - - name: NCCL_LAUNCH_MODE
28 |    | - value: GROUP
29 | 27 |   - name: HUGGING_FACE_HUB_TOKEN
30 | 28 |   value: "{{HUGGING_FACE_HUB_TOKEN}}"
31 | 29 |   ports:

0 commit comments

Comments
 (0)