Skip to content

feat: Automated Preset Docker Image Building #113

feat: Automated Preset Docker Image Building

feat: Automated Preset Docker Image Building #113

name: Build and Push Preset Models
on:
pull_request:
branches:
- main
paths:
- 'pkg/presets/falcon/**'
- 'pkg/presets/llama-2/**'
- 'pkg/presets/llama-2-chat/**'
push:
branches:
- main
paths:
- 'pkg/presets/falcon/**'
- 'pkg/presets/llama-2/**'
- 'pkg/presets/llama-2-chat/**'
workflow_dispatch:
inputs:
release:
description: 'Release (yes/no)'
required: true
default: 'no'
image_tag:
description: 'Image Tag'
required: false
permissions:
id-token: write
contents: read
jobs:
setup:
runs-on: ubuntu-latest
outputs:
image_tag: ${{ steps.set_tag.outputs.image_tag }}
FALCON_MODIFIED: ${{ steps.check_modified_paths.outputs.FALCON_MODIFIED }}
LLAMA2_MODIFIED: ${{ steps.check_modified_paths.outputs.LLAMA2_MODIFIED }}
LLAMA2_CHAT_MODIFIED: ${{ steps.check_modified_paths.outputs.LLAMA2_CHAT_MODIFIED }}
steps:
- name: Checkout
uses: actions/checkout@v4
with:
submodules: true
fetch-depth: 0
- name: Check Available Disk Space
run: df -h
- name: Get Modified files
run: |
files=$(git diff --name-only HEAD^ HEAD)
echo "Modified files: $files"
FILES_MODIFIED=""
while IFS= read -r file; do
trimmed_file=$(echo "$file" | tr -d '[:space:]')
echo "Trimmed file: $trimmed_file"
FILES_MODIFIED="${FILES_MODIFIED}${trimmed_file};"
done <<< "$files"
echo "FILES_MODIFIED=${FILES_MODIFIED}" >> $GITHUB_ENV
- name: Check Modified Paths
id: check_modified_paths
run: |
FALCON_MODIFIED=false
LLAMA2_MODIFIED=false
LLAMA2_CHAT_MODIFIED=false
IFS=';' read -ra ADDR <<< "$FILES_MODIFIED"
for file in "${ADDR[@]}"; do
echo "Checking file: $file"
if [[ "$file" == pkg/presets/falcon/* ]] && [[ "$FALCON_MODIFIED" == false ]]; then
echo "File matches falcon path: $file"
FALCON_MODIFIED=true
elif [[ "$file" == pkg/presets/llama-2/* ]] && [[ "$LLAMA2_MODIFIED" == false ]]; then
echo "File matches llama-2 path: $file"
LLAMA2_MODIFIED=true
elif [[ "$file" == pkg/presets/llama-2-chat/* ]] && [[ "$LLAMA2_CHAT_MODIFIED" == false ]]; then
echo "File matches llama-2-chat path: $file"
LLAMA2_CHAT_MODIFIED=true
else
echo "File does not match any paths: $file"
fi
done
echo "FALCON_MODIFIED=$FALCON_MODIFIED" >> $GITHUB_OUTPUT
echo "LLAMA2_MODIFIED=$LLAMA2_MODIFIED" >> $GITHUB_OUTPUT
echo "LLAMA2_CHAT_MODIFIED=$LLAMA2_CHAT_MODIFIED" >> $GITHUB_OUTPUT
- name: Images to Build
run: |
echo "FALCON_MODIFIED for this job: ${{ steps.check_modified_paths.outputs.FALCON_MODIFIED }}"
echo "LLAMA2_MODIFIED for this job: ${{ steps.check_modified_paths.outputs.LLAMA2_MODIFIED }}"
echo "LLAMA2_CHAT_MODIFIED for this job: ${{ steps.check_modified_paths.outputs.LLAMA2_CHAT_MODIFIED }}"
- name: Set Image Tag
id: set_tag
run: |
if [[ "${{ github.event_name }}" == "workflow_dispatch" && -n "${{ github.event.inputs.image_tag }}" ]]; then
echo "Using workflow dispatch to set image tag"
echo "image_tag=${{ github.event.inputs.image_tag }}" >> $GITHUB_OUTPUT
elif [[ "${{ github.event_name }}" == "push" && "${{ github.ref }}" == "refs/heads/main" ]]; then
echo "Setting image tag to be latest"
echo "image_tag=latest" >> $GITHUB_OUTPUT
else
echo "Setting image tag based on latest commit"
echo "image_tag=$(git rev-parse --short HEAD)" >> $GITHUB_OUTPUT
fi
- name: Print Image Tag
run: |
echo "image_tag for this job: ${{ steps.set_tag.outputs.image_tag }}"
- name: Save image tag as artifact
id: image_tag_path
run: |
echo "${{ steps.set_tag.outputs.image_tag }}" > image_tag.txt
echo "IMAGE_TAG_PATH=$(pwd)/image_tag.txt" >> $GITHUB_OUTPUT
- name: Upload image tag as artifact
uses: actions/upload-artifact@v3
with:
name: image-tag-artifact
path: ${{ steps.image_tag_path.outputs.IMAGE_TAG_PATH }}
build-small-models:
needs: setup
runs-on: ubuntu-latest
strategy:
fail-fast: false
matrix:
model:
- name: falcon-7b
dockerfile: docker/presets/falcon/Dockerfile
build_args: "--build-arg FALCON_MODEL_NAME=tiiuae/falcon-7b"
- name: falcon-7b-instruct
dockerfile: docker/presets/falcon/Dockerfile
build_args: "--build-arg FALCON_MODEL_NAME=tiiuae/falcon-7b-instruct"
- name: llama-2-7b
dockerfile: docker/presets/llama-2/Dockerfile
build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-7b --build-arg SRC_DIR=pkg/presets/llama-2 --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"
- name: llama-2-7b-chat
dockerfile: docker/presets/llama-2/Dockerfile
build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-7b-chat --build-arg SRC_DIR=pkg/presets/llama-2-chat --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"
- name: llama-2-13b
dockerfile: docker/presets/llama-2/Dockerfile
build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-13b --build-arg SRC_DIR=pkg/presets/llama-2 --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"
- name: llama-2-13b-chat
dockerfile: docker/presets/llama-2/Dockerfile
build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-13b-chat --build-arg SRC_DIR=pkg/presets/llama-2-chat --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"
include:
- name: falcon-7b
if: ${{ needs.setup.outputs.FALCON_MODIFIED == 'true' }}
- name: falcon-7b-instruct
if: ${{ needs.setup.outputs.FALCON_MODIFIED == 'true' }}
- name: llama-2-7b
if: ${{ needs.setup.outputs.LLAMA2_MODIFIED == 'true' }}
- name: llama-2-7b-chat
if: ${{ needs.setup.outputs.LLAMA2_CHAT_MODIFIED == 'true' }}
- name: llama-2-13b
if: ${{ needs.setup.outputs.LLAMA2_MODIFIED == 'true' }}
- name: llama-2-13b-chat
if: ${{ needs.setup.outputs.LLAMA2_CHAT_MODIFIED == 'true' }}
steps:
- name: Checkout
uses: actions/checkout@v4
with:
submodules: true
fetch-depth: 0
- name: Install Azure CLI latest
run: |
curl -sL https://aka.ms/InstallAzureCLIDeb | sudo bash
- name: 'Az CLI login'
uses: azure/[email protected]
with:
client-id: ${{ secrets.AZURE_CLIENT_ID }}
tenant-id: ${{ secrets.AZURE_TENANT_ID }}
subscription-id: ${{ secrets.AZURE_SUBSCRIPTION_ID }}
- name: 'Login to ACR'
id: acr_login
run: |
if [[ ${{ needs.setup.outputs.image_tag == 'latest'}} ]]; then
echo "ACR_NAME=aimodelsregistry" >> $GITHUB_OUTPUT
az acr login --name aimodelsregistry
else
echo "ACR_NAME=aimodelsregistrytest" >> $GITHUB_OUTPUT
az acr login --name aimodelsregistrytest
fi
- name: Build and push model (with retries)
run: |
retries=3
while [ $retries -gt 0 ]; do
BUILD_ARGS="${{ matrix.model.build_args }}"
BUILD_ARGS=${BUILD_ARGS/__EXTERNAL_IP__/${{ secrets.AZURE_WEB_SERVER_EXTERNAL_IP }}}
BUILD_ARGS=${BUILD_ARGS/__EXTERNAL_PORT__/${{ secrets.AZURE_WEB_SERVER_EXTERNAL_PORT }}}
BUILD_ARGS=${BUILD_ARGS/__WEB_SERVER_AUTH_TOKEN__/${{ secrets.WEB_SERVER_AUTH_TOKEN }}}
echo "Docker BUILD_ARGS: $BUILD_ARGS"
az acr build \
$BUILD_ARGS \
-t ${{ steps.acr_login.outputs.ACR_NAME }}.azurecr.io/${{ matrix.model.name }}:${{ needs.setup.outputs.image_tag }} \
-r ${{ steps.acr_login.outputs.ACR_NAME }} \
-f ${{ matrix.model.dockerfile }} \
. && break
retries=$((retries-1))
sleep 15
done
build-large-models:
needs: setup
if: false
runs-on: self-hosted
strategy:
fail-fast: false
matrix:
model:
# # TODO: Support large models
- name: falcon-40b
dockerfile: docker/presets/falcon/Dockerfile
build_args: "--build-arg FALCON_MODEL_NAME=tiiuae/falcon-40b"
- name: falcon-40b-instruct
dockerfile: docker/presets/falcon/Dockerfile
build_args: "--build-arg FALCON_MODEL_NAME=tiiuae/falcon-40b-instruct"
- name: llama-2-70b
dockerfile: docker/presets/llama-2/Dockerfile
build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-70b --build-arg SRC_DIR=pkg/presets/llama-2 --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"
- name: llama-2-70b-chat
dockerfile: docker/presets/llama-2/Dockerfile
build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-70b-chat --build-arg SRC_DIR=pkg/presets/llama-2-chat --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"
include:
# TODO: Support large models
- name: falcon-40b
if: ${{ needs.setup.outputs.FALCON_MODIFIED == 'true' }}
- name: falcon-40b-instruct
if: ${{ needs.setup.outputs.FALCON_MODIFIED == 'true' }}
- name: llama-2-70b
if: ${{ needs.setup.outputs.LLAMA2_MODIFIED == 'true' }}
- name: llama-2-70b-chat
if: ${{ needs.setup.outputs.LLAMA2_CHAT_MODIFIED == 'true' }}
steps:
- name: Checkout
uses: actions/checkout@v4
with:
submodules: true
fetch-depth: 0
- name: Install Azure CLI latest
run: |
curl -sL https://aka.ms/InstallAzureCLIDeb | sudo bash
- name: Az CLI login
uses: azure/[email protected]
with:
client-id: ${{ secrets.AZURE_KDM_PRESET_CLIENT_ID }}
tenant-id: ${{ secrets.AZURE_TENANT_ID }}
allow-no-subscriptions: true
- name: Set AZ Subscription
run: az account set --subscription ${{ secrets.SUBSCRIPTION_ID }}
- name: 'Login to ACR'
id: acr_login
run: |
if [[ ${{ needs.setup.outputs.image_tag == 'latest'}} ]]; then
echo "ACR_NAME=aimodelsregistry" >> $GITHUB_OUTPUT
az acr login --name aimodelsregistry
else
echo "ACR_NAME=aimodelsregistrytest" >> $GITHUB_OUTPUT
az acr login --name aimodelsregistrytest
fi
- name: Check if Docker Pod is Running (if not run it)
run: |
DEPLOYMENT=$(kubectl get deployment docker-deployment -o=jsonpath='{.metadata.name}' --ignore-not-found)
if [ -z "$DEPLOYMENT" ]; then
# Apply the deployment if it does not exist
kubectl apply -f pkg/presets/k8s/docker.yaml
fi
kubectl wait --for=condition=ready pod -l app=docker --timeout=300s
# - name: AZ Attach ACR
# run: |
- name: Build and push model (with retries)
run: |
POD_NAME=$(kubectl get pod -l app=docker -o=jsonpath='{.items[0].metadata.name}')
retries=3
while [ $retries -gt 0 ]; do
BUILD_ARGS="${{ matrix.model.build_args }}"
BUILD_ARGS=${BUILD_ARGS/__EXTERNAL_IP__/${{ secrets.AZURE_WEB_SERVER_EXTERNAL_IP }}}
BUILD_ARGS=${BUILD_ARGS/__EXTERNAL_PORT__/${{ secrets.AZURE_WEB_SERVER_EXTERNAL_PORT }}}
BUILD_ARGS=${BUILD_ARGS/__WEB_SERVER_AUTH_TOKEN__/${{ secrets.WEB_SERVER_AUTH_TOKEN }}}
echo "Docker BUILD_ARGS: $BUILD_ARGS"
kubectl exec $POD_NAME -- \
docker build \
$BUILD_ARGS \
-t ${{ steps.acr_login.outputs.ACR_NAME }}.azurecr.io/${{ matrix.model.name }}:${{ needs.setup.outputs.image_tag }} \
-r ${{ steps.acr_login.outputs.ACR_NAME }} \
-f ${{ matrix.model.dockerfile }} \
. && break
retries=$((retries-1))
sleep 15
done