diff --git a/docker/cuda_version_12.8.0/Dockerfile.nixl b/docker/cuda_version_12.8.0/Dockerfile.nixl index 2febcc3f2..4bcb66af5 100644 --- a/docker/cuda_version_12.8.0/Dockerfile.nixl +++ b/docker/cuda_version_12.8.0/Dockerfile.nixl @@ -81,7 +81,7 @@ RUN apt-get update && apt-get install -y cmake automake autotools-dev libtool l RUN apt-get update && apt-get install -y pkg-config tmux net-tools libaio-dev ; \ cd /usr/local/src; \ pip install --upgrade meson pybind11 patchelf; \ - git clone https://github.com/ai-dynamo/nixl.git -b main && \ + git clone https://github.com/ai-dynamo/nixl.git -b 0.8.0 && \ cd nixl && \ rm -rf build && \ mkdir build && \ diff --git a/docker/cuda_version_12.8.0/Dockerfile.nixl.deepep b/docker/cuda_version_12.8.0/Dockerfile.nixl.deepep index bb58d8dc5..96461dcc1 100644 --- a/docker/cuda_version_12.8.0/Dockerfile.nixl.deepep +++ b/docker/cuda_version_12.8.0/Dockerfile.nixl.deepep @@ -108,7 +108,7 @@ RUN apt-get update && apt-get install -y cmake automake autotools-dev libtool l RUN apt-get update && apt-get install -y pkg-config tmux net-tools libaio-dev ; \ cd /usr/local/src; \ pip install --upgrade meson pybind11 patchelf; \ - git clone https://github.com/ai-dynamo/nixl.git -b main && \ + git clone https://github.com/ai-dynamo/nixl.git -b 0.8.0 && \ cd nixl && \ rm -rf build && \ mkdir build && \ diff --git a/docker/cuda_version_12.8.0/Dockerfile.nixl.deepep.cache b/docker/cuda_version_12.8.0/Dockerfile.nixl.deepep.cache index e60fc24ff..2ff2dc361 100644 --- a/docker/cuda_version_12.8.0/Dockerfile.nixl.deepep.cache +++ b/docker/cuda_version_12.8.0/Dockerfile.nixl.deepep.cache @@ -110,7 +110,7 @@ RUN apt-get update && apt-get install -y cmake automake autotools-dev libtool l RUN apt-get update && apt-get install -y pkg-config tmux net-tools libaio-dev ; \ cd /usr/local/src; \ pip install --upgrade meson pybind11 patchelf; \ - git clone https://github.com/ai-dynamo/nixl.git -b main && \ + git clone https://github.com/ai-dynamo/nixl.git -b 0.8.0 && \ cd nixl && \ rm -rf build && \ mkdir build && \ diff --git a/lightllm/common/basemodel/basemodel.py b/lightllm/common/basemodel/basemodel.py index 84d53f3b1..2d4209028 100755 --- a/lightllm/common/basemodel/basemodel.py +++ b/lightllm/common/basemodel/basemodel.py @@ -112,10 +112,10 @@ def __init__(self, kvargs): self._init_some_value() self._init_custom() self._init_inferstate_cls() - self._autotune_warmup() - self._init_padded_req() # wait必须在init cudagraph 之前,避免错误捕获 self._wait_other_modules_ready() + self._autotune_warmup() + self._init_padded_req() self._init_cudagraph() self._init_prefill_cuda_graph() self._check_max_len_infer() diff --git a/requirements.txt b/requirements.txt index d3b88e2e1..8d9a011be 100644 --- a/requirements.txt +++ b/requirements.txt @@ -92,4 +92,5 @@ torchvision==0.23.0 interegular==0.3.3 partial_json_parser==0.2.1.1.post6 websockets==15.0.1 -cupy-cuda12x==13.6.0 \ No newline at end of file +cupy-cuda12x==13.6.0 +nixl==0.8.0