-
Notifications
You must be signed in to change notification settings - Fork 3
71 lines (58 loc) · 1.99 KB
/
build.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
name: Build and Push
on:
push:
branches: ["main"]
paths-ignore:
- "**.md"
pull_request:
paths-ignore:
- "**.md"
workflow_dispatch:
env:
QUAY_REPO: "quay.io/dtrifiro/llama-cpp-python-serving"
CI: true
DOCKER_BUILDKIT: 1
FORCE_COLOR: 1
jobs:
build-and-push:
name: Build and Push Image
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v4
- name: "Setup Docker Buildx"
uses: docker/setup-buildx-action@v3
- name: "Build"
run: |
date="$(date +%Y%m%d%H%M)"
rev="$(git rev-parse --short HEAD)"
docker build -t "${QUAY_REPO}:latest" -t "${QUAY_REPO}:${rev}" -t "${QUAY_REPO}:${date}" .
- name: "Build CUDA image"
run: |
date="$(date +%Y%m%d%H%M)"
rev="$(git rev-parse --short HEAD)"
docker build -t "${QUAY_REPO}:latest-cuda" -t "${QUAY_REPO}:${rev}-cuda" -t "${QUAY_REPO}:${date}-cuda" -f Dockerfile.cuda .
- name: "Push to quay"
if: github.ref == 'refs/heads/main' && github.event_name != 'pull_request'
run: |
docker login -u="${{secrets.QUAY_USERNAME}}" -p="${{secrets.QUAY_TOKEN}}" quay.io
docker push --all-tags "${QUAY_REPO}"
smoke-test:
name: "Smoke test"
needs: build-and-push
if: github.ref == 'refs/heads/main' && github.event_name != 'pull_request'
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v4
- uses: dtrifiro/[email protected]
- name: Setup Model
run: |
bash scripts/setup_model.sh
- name: Deploy InferenceService/ServingRuntime
run: |
bash scripts/deploy.sh cpu
- name: Perform sample inference
run: |
ISVC_HOST=$(kubectl get isvc llama-cpp-python -o jsonpath='{.status.components.predictor.url}' | cut -d / -f 3-)
# Add the ISVC_HOST to /etc/hosts since we can't resolve it
echo "127.0.0.1 ${ISVC_HOST}" | sudo tee -a /etc/hosts
bash scripts/inference_simple.sh