feat: Automated Preset Docker Image Building #113

Workflow file for this run

.github/workflows/preset-image-build.yml at 4700c36

	name: Build and Push Preset Models

	on:
	pull_request:
	branches:
	- main
	paths:
	- 'pkg/presets/falcon/**'
	- 'pkg/presets/llama-2/**'
	- 'pkg/presets/llama-2-chat/**'
	push:
	branches:
	- main
	paths:
	- 'pkg/presets/falcon/**'
	- 'pkg/presets/llama-2/**'
	- 'pkg/presets/llama-2-chat/**'
	workflow_dispatch:
	inputs:
	release:
	description: 'Release (yes/no)'
	required: true
	default: 'no'
	image_tag:
	description: 'Image Tag'
	required: false

	permissions:
	id-token: write
	contents: read

	jobs:
	setup:
	runs-on: ubuntu-latest
	outputs:
	image_tag: ${{ steps.set_tag.outputs.image_tag }}
	FALCON_MODIFIED: ${{ steps.check_modified_paths.outputs.FALCON_MODIFIED }}
	LLAMA2_MODIFIED: ${{ steps.check_modified_paths.outputs.LLAMA2_MODIFIED }}
	LLAMA2_CHAT_MODIFIED: ${{ steps.check_modified_paths.outputs.LLAMA2_CHAT_MODIFIED }}
	steps:
	- name: Checkout
	uses: actions/checkout@v4
	with:
	submodules: true
	fetch-depth: 0

	- name: Check Available Disk Space
	run: df -h

	- name: Get Modified files
	run: \|
	files=$(git diff --name-only HEAD^ HEAD)
	echo "Modified files: $files"
	FILES_MODIFIED=""
	while IFS= read -r file; do
	trimmed_file=$(echo "$file" \| tr -d '[:space:]')
	echo "Trimmed file: $trimmed_file"
	FILES_MODIFIED="${FILES_MODIFIED}${trimmed_file};"
	done <<< "$files"
	echo "FILES_MODIFIED=${FILES_MODIFIED}" >> $GITHUB_ENV

	- name: Check Modified Paths
	id: check_modified_paths
	run: \|
	FALCON_MODIFIED=false
	LLAMA2_MODIFIED=false
	LLAMA2_CHAT_MODIFIED=false
	IFS=';' read -ra ADDR <<< "$FILES_MODIFIED"
	for file in "${ADDR[@]}"; do
	echo "Checking file: $file"
	if [[ "$file" == pkg/presets/falcon/* ]] && [[ "$FALCON_MODIFIED" == false ]]; then
	echo "File matches falcon path: $file"
	FALCON_MODIFIED=true
	elif [[ "$file" == pkg/presets/llama-2/* ]] && [[ "$LLAMA2_MODIFIED" == false ]]; then
	echo "File matches llama-2 path: $file"
	LLAMA2_MODIFIED=true
	elif [[ "$file" == pkg/presets/llama-2-chat/* ]] && [[ "$LLAMA2_CHAT_MODIFIED" == false ]]; then
	echo "File matches llama-2-chat path: $file"
	LLAMA2_CHAT_MODIFIED=true
	else
	echo "File does not match any paths: $file"
	fi
	done
	echo "FALCON_MODIFIED=$FALCON_MODIFIED" >> $GITHUB_OUTPUT
	echo "LLAMA2_MODIFIED=$LLAMA2_MODIFIED" >> $GITHUB_OUTPUT
	echo "LLAMA2_CHAT_MODIFIED=$LLAMA2_CHAT_MODIFIED" >> $GITHUB_OUTPUT

	- name: Images to Build
	run: \|
	echo "FALCON_MODIFIED for this job: ${{ steps.check_modified_paths.outputs.FALCON_MODIFIED }}"
	echo "LLAMA2_MODIFIED for this job: ${{ steps.check_modified_paths.outputs.LLAMA2_MODIFIED }}"
	echo "LLAMA2_CHAT_MODIFIED for this job: ${{ steps.check_modified_paths.outputs.LLAMA2_CHAT_MODIFIED }}"

	- name: Set Image Tag
	id: set_tag
	run: \|
	if [[ "${{ github.event_name }}" == "workflow_dispatch" && -n "${{ github.event.inputs.image_tag }}" ]]; then
	echo "Using workflow dispatch to set image tag"
	echo "image_tag=${{ github.event.inputs.image_tag }}" >> $GITHUB_OUTPUT
	elif [[ "${{ github.event_name }}" == "push" && "${{ github.ref }}" == "refs/heads/main" ]]; then
	echo "Setting image tag to be latest"
	echo "image_tag=latest" >> $GITHUB_OUTPUT
	else
	echo "Setting image tag based on latest commit"
	echo "image_tag=$(git rev-parse --short HEAD)" >> $GITHUB_OUTPUT
	fi

	- name: Print Image Tag
	run: \|
	echo "image_tag for this job: ${{ steps.set_tag.outputs.image_tag }}"

	- name: Save image tag as artifact
	id: image_tag_path
	run: \|
	echo "${{ steps.set_tag.outputs.image_tag }}" > image_tag.txt
	echo "IMAGE_TAG_PATH=$(pwd)/image_tag.txt" >> $GITHUB_OUTPUT

	- name: Upload image tag as artifact
	uses: actions/upload-artifact@v3
	with:
	name: image-tag-artifact
	path: ${{ steps.image_tag_path.outputs.IMAGE_TAG_PATH }}

	build-small-models:
	needs: setup
	runs-on: ubuntu-latest
	strategy:
	fail-fast: false
	matrix:
	model:
	- name: falcon-7b
	dockerfile: docker/presets/falcon/Dockerfile
	build_args: "--build-arg FALCON_MODEL_NAME=tiiuae/falcon-7b"

	- name: falcon-7b-instruct
	dockerfile: docker/presets/falcon/Dockerfile
	build_args: "--build-arg FALCON_MODEL_NAME=tiiuae/falcon-7b-instruct"

	- name: llama-2-7b
	dockerfile: docker/presets/llama-2/Dockerfile
	build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-7b --build-arg SRC_DIR=pkg/presets/llama-2 --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"

	- name: llama-2-7b-chat
	dockerfile: docker/presets/llama-2/Dockerfile
	build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-7b-chat --build-arg SRC_DIR=pkg/presets/llama-2-chat --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"

	- name: llama-2-13b
	dockerfile: docker/presets/llama-2/Dockerfile
	build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-13b --build-arg SRC_DIR=pkg/presets/llama-2 --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"

	- name: llama-2-13b-chat
	dockerfile: docker/presets/llama-2/Dockerfile
	build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-13b-chat --build-arg SRC_DIR=pkg/presets/llama-2-chat --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"

	include:
	- name: falcon-7b
	if: ${{ needs.setup.outputs.FALCON_MODIFIED == 'true' }}
	- name: falcon-7b-instruct
	if: ${{ needs.setup.outputs.FALCON_MODIFIED == 'true' }}
	- name: llama-2-7b
	if: ${{ needs.setup.outputs.LLAMA2_MODIFIED == 'true' }}
	- name: llama-2-7b-chat
	if: ${{ needs.setup.outputs.LLAMA2_CHAT_MODIFIED == 'true' }}
	- name: llama-2-13b
	if: ${{ needs.setup.outputs.LLAMA2_MODIFIED == 'true' }}
	- name: llama-2-13b-chat
	if: ${{ needs.setup.outputs.LLAMA2_CHAT_MODIFIED == 'true' }}
	steps:
	- name: Checkout
	uses: actions/checkout@v4
	with:
	submodules: true
	fetch-depth: 0

	- name: Install Azure CLI latest
	run: \|
	curl -sL https://aka.ms/InstallAzureCLIDeb \| sudo bash

	- name: 'Az CLI login'
	uses: azure/[email protected]
	with:
	client-id: ${{ secrets.AZURE_CLIENT_ID }}
	tenant-id: ${{ secrets.AZURE_TENANT_ID }}
	subscription-id: ${{ secrets.AZURE_SUBSCRIPTION_ID }}

	- name: 'Login to ACR'
	id: acr_login
	run: \|
	if [[ ${{ needs.setup.outputs.image_tag == 'latest'}} ]]; then
	echo "ACR_NAME=aimodelsregistry" >> $GITHUB_OUTPUT
	az acr login --name aimodelsregistry
	else
	echo "ACR_NAME=aimodelsregistrytest" >> $GITHUB_OUTPUT
	az acr login --name aimodelsregistrytest
	fi

	- name: Build and push model (with retries)
	run: \|
	retries=3
	while [ $retries -gt 0 ]; do
	BUILD_ARGS="${{ matrix.model.build_args }}"
	BUILD_ARGS=${BUILD_ARGS/__EXTERNAL_IP__/${{ secrets.AZURE_WEB_SERVER_EXTERNAL_IP }}}
	BUILD_ARGS=${BUILD_ARGS/__EXTERNAL_PORT__/${{ secrets.AZURE_WEB_SERVER_EXTERNAL_PORT }}}
	BUILD_ARGS=${BUILD_ARGS/__WEB_SERVER_AUTH_TOKEN__/${{ secrets.WEB_SERVER_AUTH_TOKEN }}}

	echo "Docker BUILD_ARGS: $BUILD_ARGS"

	az acr build \
	$BUILD_ARGS \
	-t ${{ steps.acr_login.outputs.ACR_NAME }}.azurecr.io/${{ matrix.model.name }}:${{ needs.setup.outputs.image_tag }} \
	-r ${{ steps.acr_login.outputs.ACR_NAME }} \
	-f ${{ matrix.model.dockerfile }} \
	. && break
	retries=$((retries-1))
	sleep 15
	done

	build-large-models:
	needs: setup
	if: false
	runs-on: self-hosted
	strategy:
	fail-fast: false
	matrix:
	model:
	# # TODO: Support large models
	- name: falcon-40b
	dockerfile: docker/presets/falcon/Dockerfile
	build_args: "--build-arg FALCON_MODEL_NAME=tiiuae/falcon-40b"

	- name: falcon-40b-instruct
	dockerfile: docker/presets/falcon/Dockerfile
	build_args: "--build-arg FALCON_MODEL_NAME=tiiuae/falcon-40b-instruct"

	- name: llama-2-70b
	dockerfile: docker/presets/llama-2/Dockerfile
	build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-70b --build-arg SRC_DIR=pkg/presets/llama-2 --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"

	- name: llama-2-70b-chat
	dockerfile: docker/presets/llama-2/Dockerfile
	build_args: "--build-arg EXTERNAL_IP=__EXTERNAL_IP__ --build-arg EXTERNAL_PORT=__EXTERNAL_PORT__ --build-arg LLAMA_VERSION=llama-2-70b-chat --build-arg SRC_DIR=pkg/presets/llama-2-chat --build-arg WEB_SERVER_AUTH_TOKEN=__WEB_SERVER_AUTH_TOKEN__"

	include:
	# TODO: Support large models
	- name: falcon-40b
	if: ${{ needs.setup.outputs.FALCON_MODIFIED == 'true' }}
	- name: falcon-40b-instruct
	if: ${{ needs.setup.outputs.FALCON_MODIFIED == 'true' }}

	- name: llama-2-70b
	if: ${{ needs.setup.outputs.LLAMA2_MODIFIED == 'true' }}
	- name: llama-2-70b-chat
	if: ${{ needs.setup.outputs.LLAMA2_CHAT_MODIFIED == 'true' }}

	steps:
	- name: Checkout
	uses: actions/checkout@v4
	with:
	submodules: true
	fetch-depth: 0

	- name: Install Azure CLI latest
	run: \|
	curl -sL https://aka.ms/InstallAzureCLIDeb \| sudo bash

	- name: Az CLI login
	uses: azure/[email protected]
	with:
	client-id: ${{ secrets.AZURE_KDM_PRESET_CLIENT_ID }}
	tenant-id: ${{ secrets.AZURE_TENANT_ID }}
	allow-no-subscriptions: true

	- name: Set AZ Subscription
	run: az account set --subscription ${{ secrets.SUBSCRIPTION_ID }}

	- name: 'Login to ACR'
	id: acr_login
	run: \|
	if [[ ${{ needs.setup.outputs.image_tag == 'latest'}} ]]; then
	echo "ACR_NAME=aimodelsregistry" >> $GITHUB_OUTPUT
	az acr login --name aimodelsregistry
	else
	echo "ACR_NAME=aimodelsregistrytest" >> $GITHUB_OUTPUT
	az acr login --name aimodelsregistrytest
	fi

	- name: Check if Docker Pod is Running (if not run it)
	run: \|
	DEPLOYMENT=$(kubectl get deployment docker-deployment -o=jsonpath='{.metadata.name}' --ignore-not-found)
	if [ -z "$DEPLOYMENT" ]; then
	# Apply the deployment if it does not exist
	kubectl apply -f pkg/presets/k8s/docker.yaml
	fi
	kubectl wait --for=condition=ready pod -l app=docker --timeout=300s

	# - name: AZ Attach ACR
	# run: \|

	- name: Build and push model (with retries)
	run: \|
	POD_NAME=$(kubectl get pod -l app=docker -o=jsonpath='{.items[0].metadata.name}')
	retries=3
	while [ $retries -gt 0 ]; do
	BUILD_ARGS="${{ matrix.model.build_args }}"
	BUILD_ARGS=${BUILD_ARGS/__EXTERNAL_IP__/${{ secrets.AZURE_WEB_SERVER_EXTERNAL_IP }}}
	BUILD_ARGS=${BUILD_ARGS/__EXTERNAL_PORT__/${{ secrets.AZURE_WEB_SERVER_EXTERNAL_PORT }}}
	BUILD_ARGS=${BUILD_ARGS/__WEB_SERVER_AUTH_TOKEN__/${{ secrets.WEB_SERVER_AUTH_TOKEN }}}

	echo "Docker BUILD_ARGS: $BUILD_ARGS"

	kubectl exec $POD_NAME -- \
	docker build \
	$BUILD_ARGS \
	-t ${{ steps.acr_login.outputs.ACR_NAME }}.azurecr.io/${{ matrix.model.name }}:${{ needs.setup.outputs.image_tag }} \
	-r ${{ steps.acr_login.outputs.ACR_NAME }} \
	-f ${{ matrix.model.dockerfile }} \
	. && break
	retries=$((retries-1))
	sleep 15
	done

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

feat: Automated Preset Docker Image Building #113

Workflow file

feat: Automated Preset Docker Image Building #113

Jobs

Run details

Workflow file for this run