diff --git a/serving/docker/fastertransformer.Dockerfile b/serving/docker/fastertransformer.Dockerfile index ed1746a3e32..d2609e12672 100644 --- a/serving/docker/fastertransformer.Dockerfile +++ b/serving/docker/fastertransformer.Dockerfile @@ -19,6 +19,7 @@ ARG torch_wheel="https://aws-pytorch-unified-cicd-binaries.s3.us-west-2.amazonaw ARG ft_wheel="https://publish.djl.ai/fastertransformer/fastertransformer-0.23.0-py3-none-any.whl" ARG tb_wheel="https://publish.djl.ai/tritonserver/r23.04/tritontoolkit-23.4-py3-none-any.whl" ARG ompi_version=4.1.4 +ARG protobuf_version=3.20.3 ARG transformers_version=4.29.2 ARG accelerate_version=0.19.0 ARG bitsandbytes_version=0.38.1 @@ -60,7 +61,7 @@ RUN apt-get update && apt-get install -y wget git libnuma-dev zlib1g-dev rapidjs ln -s /usr/local/openmpi-${ompi_version} /usr/local/mpi && \ cd ../../ && rm -rf ompi && \ scripts/install_python.sh ${python_version} && \ - pip3 install ${torch_wheel} ${ft_wheel} ${tb_wheel} safetensors && \ + pip3 install ${torch_wheel} ${ft_wheel} ${tb_wheel} safetensors protobuf==${protobuf_version} && \ pip3 install transformers==${transformers_version} accelerate==${accelerate_version} bitsandbytes==${bitsandbytes_version} einops && \ pip3 install cmake sentencepiece && \ pip3 cache purge && \ diff --git a/serving/docker/pytorch-inf2.Dockerfile b/serving/docker/pytorch-inf2.Dockerfile index 801d15f35ca..01d94c038c6 100644 --- a/serving/docker/pytorch-inf2.Dockerfile +++ b/serving/docker/pytorch-inf2.Dockerfile @@ -16,6 +16,7 @@ ARG python_version=3.8 ARG torch_neuronx_version=1.13.1.1.8.0 ARG transformers_neuronx_version=0.4.60 ARG neuronx_distributed_version=0.1.0 +ARG protobuf_version=3.20.3 ARG transformers_version=4.30.1 ARG accelerate_version=0.20.3 ARG diffusers_version=0.14.0 @@ -59,7 +60,7 @@ RUN mkdir -p /opt/djl/bin && cp scripts/telemetry.sh /opt/djl/bin && \ scripts/install_inferentia2.sh && \ pip install transformers==${transformers_version} accelerate==${accelerate_version} safetensors \ neuronx-cc==2.6.* torch_neuronx==${torch_neuronx_version} transformers-neuronx==${transformers_neuronx_version} \ - neuronx_distributed==${neuronx_distributed_version} \ + neuronx_distributed==${neuronx_distributed_version} protobuf==${protobuf_version} \ diffusers==${diffusers_version} opencv-contrib-python-headless Pillow --extra-index-url=https://pip.repos.neuron.amazonaws.com && \ scripts/install_s5cmd.sh x64 && \ scripts/patch_oss_dlc.sh python && \