-
Notifications
You must be signed in to change notification settings - Fork 65
53 lines (51 loc) · 1.54 KB
/
build-neuronx-tgi.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
# Workflow header: display name and the events that start a run.
name: Build and push NeuronX docker image to ghcr.io

on:
  # Manual runs from the Actions UI / API.
  workflow_dispatch:
  # Automatic runs whenever any tag is pushed.
  push:
    tags:
      - '*'
jobs:
  # Builds the Python distribution, derives its version from the sdist file
  # name, then builds the Docker image and pushes it to ghcr.io.
  docker:
    runs-on:
      group: aws-general-8-plus
    permissions:
      # NOTE(review): no step visible in this job writes to the repository;
      # `contents: read` may be sufficient — confirm before tightening.
      contents: write
      # Needed to push the image to ghcr.io with GITHUB_TOKEN.
      packages: write
    steps:
      - name: Checkout sources
        uses: actions/checkout@v4

      - name: Install python and create venv
        run: |
          # apt-get rather than apt: apt's CLI is not stable for scripts.
          sudo apt-get update
          sudo apt-get install -y python3-venv python3-dev
          python3 -m venv aws_neuron_venv_pytorch
          source aws_neuron_venv_pytorch/bin/activate
          python -m pip install -U pip
          python -m pip install build
          python -m pip config set global.extra-index-url https://pip.repos.neuron.amazonaws.com
          # Produces the sdist/wheel under dist/, read by the next step.
          python -m build .

      - name: Extract version
        run: |
          # Take the sdist name, drop everything up to the first '-', then
          # drop the '.tar.gz' suffix; what remains is exported as ON_VERSION
          # for the following steps.
          pkg=$(ls dist/optimum_neuron*.tar.gz)
          tmp=${pkg#*-}
          echo "ON_VERSION=${tmp%.tar.gz*}" >> "$GITHUB_ENV"

      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@v3

      - name: Login to ghcr.io
        uses: docker/login-action@v3
        with:
          registry: ghcr.io
          username: ${{ github.actor }}
          password: ${{ secrets.GITHUB_TOKEN }}

      - name: Build and push
        uses: docker/build-push-action@v6
        with:
          context: .
          file: text-generation-inference/Dockerfile
          push: true
          build-args: VERSION=${{ env.ON_VERSION }}
          # One tag per line: the versioned tag plus `latest`.
          tags: |
            ghcr.io/huggingface/neuronx-tgi:${{ env.ON_VERSION }}
            ghcr.io/huggingface/neuronx-tgi:latest