diff --git a/.github/workflows/extract-binary.yaml b/.github/workflows/extract-binary.yaml index 5910570a..46cb79a1 100644 --- a/.github/workflows/extract-binary.yaml +++ b/.github/workflows/extract-binary.yaml @@ -4,18 +4,14 @@ on: workflow_dispatch: permissions: - # contents: write packages: write jobs: extract-binary: - # strategy: - # fail-fast: true - # matrix: - # build-type: - # - cublas-cuda12 runs-on: ubuntu-latest timeout-minutes: 240 + env: + LOCAL_AI_VERSION: v2.1.0 steps: - uses: easimon/maximize-build-space@master with: @@ -25,15 +21,6 @@ jobs: remove-haskell: 'true' remove-android: 'true' - - name: cleanup disk space - run: | - # docker system prune -f -a --volumes - # sudo rm -rf /usr/share/dotnet - # sudo rm -rf /opt/ghc - # sudo rm -rf "/usr/local/share/boost" - # sudo rm -rf "$AGENT_TOOLSDIRECTORY" - df -H - - name: install oras env: ORAS_VERSION: 1.1.0 @@ -50,7 +37,7 @@ jobs: - name: extract artifacts from local-ai container run: | - crane export quay.io/go-skynet/local-ai:v2.0.0-cublas-cuda12 > export.tar + crane export quay.io/go-skynet/local-ai:${LOCAL_AI_VERSION}-cublas-cuda12 > export.tar tar -xvf export.tar build - name: Login to GHCR @@ -62,6 +49,6 @@ jobs: - name: create and push oci artifact run: | - oras push ghcr.io/sozercan/test/local-ai:v2.0.0-cublas-cuda12 \ + oras push ghcr.io/sozercan/test/local-ai:${LOCAL_AI_VERSION}-cublas-cuda12 \ build/local-ai:application/octet-stream \ build/backend-assets/:application/octet-stream diff --git a/pkg/aikit2llb/convert.go b/pkg/aikit2llb/convert.go index 1b3d8e1f..2903e822 100644 --- a/pkg/aikit2llb/convert.go +++ b/pkg/aikit2llb/convert.go @@ -15,7 +15,7 @@ import ( const ( debianSlim = "docker.io/library/debian:12-slim" distrolessBase = "gcr.io/distroless/cc-debian12:latest" - localAIVersion = "v2.0.0" + localAIVersion = "v2.1.0" cudaVersion = "12-3" )