configure nightly docker builds (#1454) [skip ci]
Browse files
* configure nightly docker builds
* also test update pytorch in modal ci
- .github/workflows/main.yml +3 -5
- .github/workflows/nightlies.yml +114 -0
- .github/workflows/tests.yml +5 -0
.github/workflows/main.yml
CHANGED
|
@@ -28,7 +28,7 @@ jobs:
|
|
| 28 |
- cuda: 121
|
| 29 |
cuda_version: 12.1.0
|
| 30 |
python_version: "3.11"
|
| 31 |
-
pytorch: 2.1
|
| 32 |
axolotl_extras:
|
| 33 |
runs-on: axolotl-gpu-runner
|
| 34 |
steps:
|
|
@@ -63,7 +63,7 @@ jobs:
|
|
| 63 |
${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
|
| 64 |
labels: ${{ steps.metadata.outputs.labels }}
|
| 65 |
|
| 66 |
-
build-axolotl-runpod:
|
| 67 |
needs: build-axolotl
|
| 68 |
if: ${{ ! contains(github.event.commits[0].message, '[skip docker]]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
|
| 69 |
# this job needs to be run on self-hosted GPU runners...
|
|
@@ -84,7 +84,7 @@ jobs:
|
|
| 84 |
- cuda: 121
|
| 85 |
cuda_version: 12.1.0
|
| 86 |
python_version: "3.11"
|
| 87 |
-
pytorch: 2.1
|
| 88 |
axolotl_extras:
|
| 89 |
runs-on: axolotl-gpu-runner
|
| 90 |
steps:
|
|
@@ -113,7 +113,5 @@ jobs:
|
|
| 113 |
push: ${{ github.event_name != 'pull_request' }}
|
| 114 |
tags: |
|
| 115 |
${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
| 116 |
-
winglian/axolotl-runpod:main-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
| 117 |
${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
|
| 118 |
-
${{ (matrix.is_latest) && format('{0}-latest', 'winglian/axolotl-runpod:main') || '' }}
|
| 119 |
labels: ${{ steps.metadata.outputs.labels }}
|
|
|
|
| 28 |
- cuda: 121
|
| 29 |
cuda_version: 12.1.0
|
| 30 |
python_version: "3.11"
|
| 31 |
+
pytorch: 2.2.1
|
| 32 |
axolotl_extras:
|
| 33 |
runs-on: axolotl-gpu-runner
|
| 34 |
steps:
|
|
|
|
| 63 |
${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
|
| 64 |
labels: ${{ steps.metadata.outputs.labels }}
|
| 65 |
|
| 66 |
+
build-axolotl-cloud:
|
| 67 |
needs: build-axolotl
|
| 68 |
if: ${{ ! contains(github.event.commits[0].message, '[skip docker]]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
|
| 69 |
# this job needs to be run on self-hosted GPU runners...
|
|
|
|
| 84 |
- cuda: 121
|
| 85 |
cuda_version: 12.1.0
|
| 86 |
python_version: "3.11"
|
| 87 |
+
pytorch: 2.2.1
|
| 88 |
axolotl_extras:
|
| 89 |
runs-on: axolotl-gpu-runner
|
| 90 |
steps:
|
|
|
|
| 113 |
push: ${{ github.event_name != 'pull_request' }}
|
| 114 |
tags: |
|
| 115 |
${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
|
|
|
| 116 |
${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
|
|
|
|
| 117 |
labels: ${{ steps.metadata.outputs.labels }}
|
.github/workflows/nightlies.yml
ADDED
|
@@ -0,0 +1,114 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
name: docker-nightlies
|
| 2 |
+
|
| 3 |
+
on:
|
| 4 |
+
workflow_dispatch:
|
| 5 |
+
schedule:
|
| 6 |
+
- cron: '0 0 * * *' # Runs at 00:00 UTC every day
|
| 7 |
+
|
| 8 |
+
jobs:
|
| 9 |
+
build-axolotl:
|
| 10 |
+
if: ${{ ! contains(github.event.commits[0].message, '[skip docker]]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
|
| 11 |
+
strategy:
|
| 12 |
+
fail-fast: false
|
| 13 |
+
matrix:
|
| 14 |
+
include:
|
| 15 |
+
- cuda: 118
|
| 16 |
+
cuda_version: 11.8.0
|
| 17 |
+
python_version: "3.10"
|
| 18 |
+
pytorch: 2.1.2
|
| 19 |
+
axolotl_extras:
|
| 20 |
+
axolotl_args: "--extra-index-url https://download.pytorch.org/whl/cu118"
|
| 21 |
+
is_latest: true
|
| 22 |
+
- cuda: 121
|
| 23 |
+
cuda_version: 12.1.0
|
| 24 |
+
python_version: "3.10"
|
| 25 |
+
pytorch: 2.1.2
|
| 26 |
+
axolotl_extras:
|
| 27 |
+
- cuda: 121
|
| 28 |
+
cuda_version: 12.1.0
|
| 29 |
+
python_version: "3.11"
|
| 30 |
+
pytorch: 2.2.1
|
| 31 |
+
axolotl_extras:
|
| 32 |
+
runs-on: axolotl-gpu-runner
|
| 33 |
+
steps:
|
| 34 |
+
- name: Checkout
|
| 35 |
+
uses: actions/checkout@v4
|
| 36 |
+
- name: Docker metadata
|
| 37 |
+
id: metadata
|
| 38 |
+
uses: docker/metadata-action@v5
|
| 39 |
+
with:
|
| 40 |
+
images: winglian/axolotl
|
| 41 |
+
- name: Set up Docker Buildx
|
| 42 |
+
uses: docker/setup-buildx-action@v3
|
| 43 |
+
- name: Login to Docker Hub
|
| 44 |
+
uses: docker/login-action@v3
|
| 45 |
+
with:
|
| 46 |
+
username: ${{ secrets.DOCKERHUB_USERNAME }}
|
| 47 |
+
password: ${{ secrets.DOCKERHUB_TOKEN }}
|
| 48 |
+
# guidance for testing before pushing: https://docs.docker.com/build/ci/github-actions/test-before-push/
|
| 49 |
+
- name: Build and export to Docker
|
| 50 |
+
uses: docker/build-push-action@v5
|
| 51 |
+
with:
|
| 52 |
+
context: .
|
| 53 |
+
build-args: |
|
| 54 |
+
BASE_TAG=${{ github.ref_name }}-base-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}
|
| 55 |
+
CUDA=${{ matrix.cuda }}
|
| 56 |
+
PYTORCH_VERSION=${{ matrix.pytorch }}
|
| 57 |
+
AXOLOTL_ARGS=${{ matrix.axolotl_args }}
|
| 58 |
+
file: ./docker/Dockerfile
|
| 59 |
+
push: ${{ github.event_name != 'pull_request' }}
|
| 60 |
+
tags: |
|
| 61 |
+
${{ steps.metadata.outputs.tags }}-${{ format('{0:yyyyMMdd}', github.event.repository.pushed_at) }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
| 62 |
+
labels: ${{ steps.metadata.outputs.labels }}
|
| 63 |
+
|
| 64 |
+
build-axolotl-cloud:
|
| 65 |
+
needs: build-axolotl
|
| 66 |
+
if: ${{ ! contains(github.event.commits[0].message, '[skip docker]]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
|
| 67 |
+
# this job needs to be run on self-hosted GPU runners...
|
| 68 |
+
strategy:
|
| 69 |
+
matrix:
|
| 70 |
+
include:
|
| 71 |
+
- cuda: 118
|
| 72 |
+
cuda_version: 11.8.0
|
| 73 |
+
python_version: "3.10"
|
| 74 |
+
pytorch: 2.1.2
|
| 75 |
+
axolotl_extras:
|
| 76 |
+
is_latest: true
|
| 77 |
+
- cuda: 121
|
| 78 |
+
cuda_version: 12.1.0
|
| 79 |
+
python_version: "3.10"
|
| 80 |
+
pytorch: 2.1.2
|
| 81 |
+
axolotl_extras:
|
| 82 |
+
- cuda: 121
|
| 83 |
+
cuda_version: 12.1.0
|
| 84 |
+
python_version: "3.11"
|
| 85 |
+
pytorch: 2.2.1
|
| 86 |
+
axolotl_extras:
|
| 87 |
+
runs-on: axolotl-gpu-runner
|
| 88 |
+
steps:
|
| 89 |
+
- name: Checkout
|
| 90 |
+
uses: actions/checkout@v4
|
| 91 |
+
- name: Docker metadata
|
| 92 |
+
id: metadata
|
| 93 |
+
uses: docker/metadata-action@v5
|
| 94 |
+
with:
|
| 95 |
+
images: winglian/axolotl-cloud
|
| 96 |
+
- name: Login to Docker Hub
|
| 97 |
+
uses: docker/login-action@v3
|
| 98 |
+
with:
|
| 99 |
+
username: ${{ secrets.DOCKERHUB_USERNAME }}
|
| 100 |
+
password: ${{ secrets.DOCKERHUB_TOKEN }}
|
| 101 |
+
- name: Set up Docker Buildx
|
| 102 |
+
uses: docker/setup-buildx-action@v2
|
| 103 |
+
- name: Build
|
| 104 |
+
uses: docker/build-push-action@v5
|
| 105 |
+
with:
|
| 106 |
+
context: .
|
| 107 |
+
build-args: |
|
| 108 |
+
BASE_TAG=${{ github.ref_name }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
| 109 |
+
CUDA=${{ matrix.cuda }}
|
| 110 |
+
file: ./docker/Dockerfile-cloud
|
| 111 |
+
push: ${{ github.event_name != 'pull_request' }}
|
| 112 |
+
tags: |
|
| 113 |
+
${{ steps.metadata.outputs.tags }}-${{ format('{0:yyyyMMdd}', github.event.repository.pushed_at) }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
| 114 |
+
labels: ${{ steps.metadata.outputs.labels }}
|
.github/workflows/tests.yml
CHANGED
|
@@ -79,6 +79,11 @@ jobs:
|
|
| 79 |
python_version: "3.10"
|
| 80 |
pytorch: 2.1.2
|
| 81 |
num_gpus: 1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 82 |
steps:
|
| 83 |
- name: Checkout
|
| 84 |
uses: actions/checkout@v4
|
|
|
|
| 79 |
python_version: "3.10"
|
| 80 |
pytorch: 2.1.2
|
| 81 |
num_gpus: 1
|
| 82 |
+
- cuda: 121
|
| 83 |
+
cuda_version: 12.1.0
|
| 84 |
+
python_version: "3.11"
|
| 85 |
+
pytorch: 2.2.1
|
| 86 |
+
num_gpus: 1
|
| 87 |
steps:
|
| 88 |
- name: Checkout
|
| 89 |
uses: actions/checkout@v4
|