# sklearnserver-docker-publish.yml
# Repository is a fork of kserve/kserve.
name: Sklearn Server Docker Publisher

# Triggers: pushes to the listed branches, pushes of tags matching v*,
# and every pull request.
on:
  push:
    branches: [master, sklearn-runtime-schedule-retry-on-failure]
    tags: ['v*']
  pull_request:

# Workflow-wide environment variable available to every job.
env:
  IMAGE_NAME: sklearnserver

# Runs are grouped by workflow name and git ref; starting a new run in a
# group cancels the one already in progress.
concurrency:
  cancel-in-progress: true
  group: ${{ github.workflow }}-${{ github.ref }}
jobs:
  # Main test job: builds python/sklearn.Dockerfile once per target platform.
  # The image is never pushed (push: false); a completed build is the pass
  # criterion.
  test:
    runs-on: ubuntu-latest
    timeout-minutes: 20  # timeout for the test job
    strategy:
      # Let every platform run to completion. With the default fail-fast
      # behaviour a failure on one platform would cancel the others.
      fail-fast: false
      matrix:
        platform: [linux/amd64, linux/arm64/v8, linux/ppc64le]
    steps:
      - name: Checkout source
        uses: actions/checkout@v4

      # QEMU supplies emulation for the non-native platforms in the matrix.
      - name: Setup QEMU
        uses: docker/setup-qemu-action@v3

      - name: Setup Docker Buildx
        uses: docker/setup-buildx-action@v3

      # Run tests using Docker Buildx
      - name: Run tests
        id: run_tests  # Give this step an ID to reference its result
        uses: docker/build-push-action@v5
        with:
          platforms: ${{ matrix.platform }}
          context: python
          file: python/sklearn.Dockerfile
          push: false
          # Layer cache lives in the GitHub Actions cache service (type=gha).
          # src=/dest= are parameters of the local cache backend and do not
          # apply to gha, so they are not used here. A per-platform scope
          # stops the matrix legs from overwriting each other's cache in the
          # shared default scope. No separate actions/cache step is needed:
          # the gha backend does not read or write a runner directory.
          cache-from: type=gha,scope=sklearnserver-${{ matrix.platform }}
          cache-to: type=gha,scope=sklearnserver-${{ matrix.platform }},mode=max
          provenance: false
# Report job: prints the overall result of the `test` job to the run log.
  log-result:
    needs: test
    # always() keeps this job from being skipped when `test` did not succeed.
    if: always()
    runs-on: ubuntu-latest
    steps:
      - name: Log test result
        run: |
          echo "Test job result: ${{ needs.test.result }}"
# Retry job: re-runs the build for linux/ppc64le only, and only when the
# `test` job reported a failure.
  retry:
    runs-on: ubuntu-latest
    # `test` must be a direct dependency for needs.test.result to be readable;
    # `log-result` is kept so the retry still starts after the result is logged.
    needs: [test, log-result]
    # always() prevents the implicit success() check from skipping this job
    # when `test` failed; the comparison restricts it to the failure case
    # (a bare always() would re-run the build on every workflow run).
    if: ${{ always() && needs.test.result == 'failure' }}
    timeout-minutes: 20  # Set timeout for the retry job
    strategy:
      matrix:
        platform: [linux/ppc64le]  # Only retry for linux/ppc64le
    steps:
      - name: Checkout source
        uses: actions/checkout@v4

      # QEMU supplies the ppc64le emulation.
      - name: Setup QEMU
        uses: docker/setup-qemu-action@v3

      - name: Setup Docker Buildx
        uses: docker/setup-buildx-action@v3

      # Run retry tests using Docker Buildx and cached layers
      - name: Run tests again for ppc64le
        uses: docker/build-push-action@v5
        with:
          platforms: ${{ matrix.platform }}
          context: python
          file: python/sklearn.Dockerfile
          push: false
          # Layer cache lives in the GitHub Actions cache service (type=gha).
          # src=/dest= are parameters of the local cache backend and do not
          # apply to gha, so they are not used here. The scope is keyed by
          # platform so this build's layers stay separate from caches stored
          # under other scopes. No separate actions/cache step is needed:
          # the gha backend does not read or write a runner directory.
          cache-from: type=gha,scope=sklearnserver-${{ matrix.platform }}
          cache-to: type=gha,scope=sklearnserver-${{ matrix.platform }},mode=max
          provenance: false