diff --git a/.github/workflows/inference_cache_llm.yml b/.github/workflows/inference_cache_llm.yml index bc8cd7bfb..b6988fb72 100644 --- a/.github/workflows/inference_cache_llm.yml +++ b/.github/workflows/inference_cache_llm.yml @@ -39,7 +39,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Checkout uses: actions/checkout@v4 diff --git a/.github/workflows/inference_cache_stable_diffusion.yml b/.github/workflows/inference_cache_stable_diffusion.yml index 857aca840..2bd83eae1 100644 --- a/.github/workflows/inference_cache_stable_diffusion.yml +++ b/.github/workflows/inference_cache_stable_diffusion.yml @@ -29,7 +29,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.18.3.0 aws-neuronx-runtime-lib=2.21.41.0-fb1705f5f aws-neuronx-collectives=2.21.46.0-69b77134b -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Checkout uses: actions/checkout@v4 diff --git a/.github/workflows/test_inf2.yml b/.github/workflows/test_inf2.yml index f6e18ef30..d71e47670 100644 --- a/.github/workflows/test_inf2.yml +++ b/.github/workflows/test_inf2.yml @@ -32,7 +32,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Checkout uses: actions/checkout@v2 diff --git a/.github/workflows/test_inf2_export.yml b/.github/workflows/test_inf2_export.yml index 836034240..a863652a0 100644 --- a/.github/workflows/test_inf2_export.yml +++ b/.github/workflows/test_inf2_export.yml @@ -32,7 +32,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Checkout uses: actions/checkout@v2 diff --git a/.github/workflows/test_inf2_full_export.yml b/.github/workflows/test_inf2_full_export.yml index 8607af5a1..921596bfe 100644 --- a/.github/workflows/test_inf2_full_export.yml +++ b/.github/workflows/test_inf2_full_export.yml @@ -30,7 +30,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Checkout uses: actions/checkout@v2 diff --git a/.github/workflows/test_inf2_inference.yml b/.github/workflows/test_inf2_inference.yml index 5a0405e00..1a37a23a2 100644 --- a/.github/workflows/test_inf2_inference.yml +++ b/.github/workflows/test_inf2_inference.yml @@ -32,7 +32,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Install cv2 dependencies run: | diff --git a/.github/workflows/test_inf2_tgi.yml b/.github/workflows/test_inf2_tgi.yml index 200c7d38a..c8dad05c1 100644 --- a/.github/workflows/test_inf2_tgi.yml +++ b/.github/workflows/test_inf2_tgi.yml @@ -34,7 +34,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Checkout uses: actions/checkout@v2 diff --git a/.github/workflows/test_trainium_common.yml b/.github/workflows/test_trainium_common.yml index c8c56fdf4..78233b641 100644 --- a/.github/workflows/test_trainium_common.yml +++ b/.github/workflows/test_trainium_common.yml @@ -34,7 +34,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Install cv2 dependencies run: | diff --git a/.github/workflows/test_trainium_distributed.yml b/.github/workflows/test_trainium_distributed.yml index 892111671..1571ec7c1 100644 --- a/.github/workflows/test_trainium_distributed.yml +++ b/.github/workflows/test_trainium_distributed.yml @@ -33,7 +33,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Install cv2 dependencies run: | diff --git a/.github/workflows/test_trainium_examples.yml b/.github/workflows/test_trainium_examples.yml index e1167ded5..d5a18d61d 100644 --- a/.github/workflows/test_trainium_examples.yml +++ b/.github/workflows/test_trainium_examples.yml @@ -41,7 +41,7 @@ jobs: EOF wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEURON.PUB | sudo apt-key add - sudo apt-get update -y - sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b aws-neuronx-collectives=2.22.26.0-17a033bc8 -y + sudo apt-get install aws-neuronx-tools=2.19.0.0 aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 aws-neuronx-collectives=2.22.33.0-d2128d1aa -y export PATH=/opt/aws/neuron/bin:$PATH - name: Install cv2 dependencies run: | diff --git a/optimum/neuron/version.py b/optimum/neuron/version.py index 8ff56cce1..58724afd3 100644 --- a/optimum/neuron/version.py +++ b/optimum/neuron/version.py @@ -14,4 +14,4 @@ __version__ = "0.0.27.dev0" -__sdk_version__ = "2.20.0" +__sdk_version__ = "2.20.2" diff --git a/setup.py b/setup.py index 1dfa521ed..535a96f33 100644 --- a/setup.py +++ b/setup.py @@ -64,13 +64,13 @@ ], "neuronx": [ "wheel", - "neuronx-cc==2.15.128.0", - "torch-neuronx==2.1.2.2.3.0", + "neuronx-cc==2.15.143.0", + "torch-neuronx==2.1.2.2.3.2", "transformers-neuronx==0.12.313", "torch==2.1.2.*", "torchvision==0.16.*", "neuronx_distributed==0.9.0", - "libneuronxla==2.0.4115.0", + "libneuronxla==2.0.5347.0", ], "diffusers": ["diffusers>=0.28.0, <=0.30.3", "peft"], "sentence-transformers": ["sentence-transformers >= 2.2.0"], diff --git a/text-generation-inference/Dockerfile b/text-generation-inference/Dockerfile index 8dab8b378..01ff66472 100644 --- a/text-generation-inference/Dockerfile +++ b/text-generation-inference/Dockerfile @@ -95,9 +95,9 @@ RUN wget -qO - https://apt.repos.neuron.amazonaws.com/GPG-PUB-KEY-AMAZON-AWS-NEU # Install neuronx packages RUN apt-get update -y \ && apt-get install -y --no-install-recommends \ - aws-neuronx-dkms=2.18.12.0 \ - aws-neuronx-collectives=2.22.26.0-17a033bc8 \ - aws-neuronx-runtime-lib=2.22.14.0-6e27b8d5b \ + aws-neuronx-dkms=2.18.20.0 \ + aws-neuronx-collectives=2.22.33.0-d2128d1aa \ + aws-neuronx-runtime-lib=2.22.19.0-5856c0b42 \ aws-neuronx-tools=2.19.0.0 \ libxml2 \ && rm -rf /var/lib/apt/lists/* \ @@ -106,10 +106,10 @@ RUN apt-get update -y \ ENV PATH="/opt/bin/:/opt/aws/neuron/bin:${PATH}" RUN pip3 install \ - neuronx-cc==2.15.128.0 \ - torch-neuronx==2.1.2.2.3.0 \ + neuronx-cc==2.15.143.0 \ + torch-neuronx==2.1.2.2.3.2 \ transformers-neuronx==0.12.313 \ - libneuronxla==2.0.4115.0 \ + libneuronxla==2.0.5347.0 \ --extra-index-url=https://pip.repos.neuron.amazonaws.com # Install HuggingFace packages