From fdeee7c949462bf8c4e548de7cd1828628624682 Mon Sep 17 00:00:00 2001
From: omrishiv <327609+omrishiv@users.noreply.github.com>
Date: Fri, 20 Sep 2024 11:34:17 -0700
Subject: [PATCH] update neuron to 2.20

Signed-off-by: omrishiv <327609+omrishiv@users.noreply.github.com>
---
Reviewer notes (commentary only; text between the three-dash line above and
the first "diff --git" line is not part of the commit message):

  * Dockerfile.neuron, first hunk: the default BASE_IMAGE tag moves from
    ...-sdk2.19.1-ubuntu20.04 to ...-sdk2.20.0-ubuntu20.04. The image
    repository and the 2.1.2-neuronx-py310 prefix are unchanged.
  * Dockerfile.neuron, second hunk: the neuronx-cc pin installed with
    "pip install --pre" moves from 2.12.* to 2.15.*. The extra index URL
    and the other pip install lines are untouched context.
  * requirements-neuron.txt: the lower bounds rise to
    transformers-neuronx >= 0.12.0 and torch-neuronx >= 2.1.2. neuronx-cc
    remains unpinned in this file, while the Dockerfile pins it to 2.15.*.
  * NOTE(review): presumably neuronx-cc 2.15.* and transformers-neuronx
    0.12.x are the versions shipped with Neuron SDK 2.20 -- confirm against
    the SDK release notes before merging.
  * In the requirements-neuron.txt hunk, the first line after the hunk
    header (" -r requirements-common.txt") is a context line, not a removal:
    it begins with a space, and the hunk's six-line count depends on it.

 Dockerfile.neuron       | 4 ++--
 requirements-neuron.txt | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/Dockerfile.neuron b/Dockerfile.neuron
index f0c3479625a70..647ed99a41e70 100644
--- a/Dockerfile.neuron
+++ b/Dockerfile.neuron
@@ -1,5 +1,5 @@
 # default base image
-ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.1.2-neuronx-py310-sdk2.19.1-ubuntu20.04"
+ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.1.2-neuronx-py310-sdk2.20.0-ubuntu20.04"
 
 FROM $BASE_IMAGE
 
@@ -20,7 +20,7 @@ RUN python3 -m pip install --upgrade pip
 RUN python3 -m pip install --no-cache-dir fastapi ninja tokenizers pandas
 RUN python3 -m pip install sentencepiece transformers==4.36.2 -U
 RUN python3 -m pip install transformers-neuronx --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
-RUN python3 -m pip install --pre neuronx-cc==2.12.* --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
+RUN python3 -m pip install --pre neuronx-cc==2.15.* --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
 
 COPY ./vllm /app/vllm/vllm
 COPY ./setup.py /app/vllm/setup.py
diff --git a/requirements-neuron.txt b/requirements-neuron.txt
index 92b705b4b2d67..148fdbe0d6310 100644
--- a/requirements-neuron.txt
+++ b/requirements-neuron.txt
@@ -2,6 +2,6 @@
 -r requirements-common.txt
 
 # Dependencies for Neuron devices
-transformers-neuronx >= 0.9.0
-torch-neuronx >= 2.1.0
+transformers-neuronx >= 0.12.0
+torch-neuronx >= 2.1.2
 neuronx-cc