winglian committed on
Commit
8cb127a
·
unverified ·
1 Parent(s): 05b398a

configure nightly docker builds (#1454) [skip ci]

Browse files

* configure nightly docker builds

* also test the updated pytorch in modal ci

.github/workflows/main.yml CHANGED
@@ -28,7 +28,7 @@ jobs:
28
  - cuda: 121
29
  cuda_version: 12.1.0
30
  python_version: "3.11"
31
- pytorch: 2.1.2
32
  axolotl_extras:
33
  runs-on: axolotl-gpu-runner
34
  steps:
@@ -63,7 +63,7 @@ jobs:
63
  ${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
64
  labels: ${{ steps.metadata.outputs.labels }}
65
 
66
- build-axolotl-runpod:
67
  needs: build-axolotl
68
  if: ${{ ! contains(github.event.commits[0].message, '[skip docker]]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
69
  # this job needs to be run on self-hosted GPU runners...
@@ -84,7 +84,7 @@ jobs:
84
  - cuda: 121
85
  cuda_version: 12.1.0
86
  python_version: "3.11"
87
- pytorch: 2.1.2
88
  axolotl_extras:
89
  runs-on: axolotl-gpu-runner
90
  steps:
@@ -113,7 +113,5 @@ jobs:
113
  push: ${{ github.event_name != 'pull_request' }}
114
  tags: |
115
  ${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
116
- winglian/axolotl-runpod:main-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
117
  ${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
118
- ${{ (matrix.is_latest) && format('{0}-latest', 'winglian/axolotl-runpod:main') || '' }}
119
  labels: ${{ steps.metadata.outputs.labels }}
 
28
  - cuda: 121
29
  cuda_version: 12.1.0
30
  python_version: "3.11"
31
+ pytorch: 2.2.1
32
  axolotl_extras:
33
  runs-on: axolotl-gpu-runner
34
  steps:
 
63
  ${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
64
  labels: ${{ steps.metadata.outputs.labels }}
65
 
66
+ build-axolotl-cloud:
67
  needs: build-axolotl
68
  if: ${{ ! contains(github.event.commits[0].message, '[skip docker]]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
69
  # this job needs to be run on self-hosted GPU runners...
 
84
  - cuda: 121
85
  cuda_version: 12.1.0
86
  python_version: "3.11"
87
+ pytorch: 2.2.1
88
  axolotl_extras:
89
  runs-on: axolotl-gpu-runner
90
  steps:
 
113
  push: ${{ github.event_name != 'pull_request' }}
114
  tags: |
115
  ${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
 
116
  ${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
 
117
  labels: ${{ steps.metadata.outputs.labels }}
.github/workflows/nightlies.yml ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: docker-nightlies
2
+
3
+ on:
4
+ workflow_dispatch:
5
+ schedule:
6
+ - cron: '0 0 * * *' # Runs at 00:00 UTC every day
7
+
8
+ jobs:
9
+ build-axolotl:
10
+ if: ${{ ! contains(github.event.commits[0].message, '[skip docker]]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
11
+ strategy:
12
+ fail-fast: false
13
+ matrix:
14
+ include:
15
+ - cuda: 118
16
+ cuda_version: 11.8.0
17
+ python_version: "3.10"
18
+ pytorch: 2.1.2
19
+ axolotl_extras:
20
+ axolotl_args: "--extra-index-url https://download.pytorch.org/whl/cu118"
21
+ is_latest: true
22
+ - cuda: 121
23
+ cuda_version: 12.1.0
24
+ python_version: "3.10"
25
+ pytorch: 2.1.2
26
+ axolotl_extras:
27
+ - cuda: 121
28
+ cuda_version: 12.1.0
29
+ python_version: "3.11"
30
+ pytorch: 2.2.1
31
+ axolotl_extras:
32
+ runs-on: axolotl-gpu-runner
33
+ steps:
34
+ - name: Checkout
35
+ uses: actions/checkout@v4
36
+ - name: Docker metadata
37
+ id: metadata
38
+ uses: docker/metadata-action@v5
39
+ with:
40
+ images: winglian/axolotl
41
+ - name: Set up Docker Buildx
42
+ uses: docker/setup-buildx-action@v3
43
+ - name: Login to Docker Hub
44
+ uses: docker/login-action@v3
45
+ with:
46
+ username: ${{ secrets.DOCKERHUB_USERNAME }}
47
+ password: ${{ secrets.DOCKERHUB_TOKEN }}
48
+ # guidance for testing before pushing: https://docs.docker.com/build/ci/github-actions/test-before-push/
49
+ - name: Build and export to Docker
50
+ uses: docker/build-push-action@v5
51
+ with:
52
+ context: .
53
+ build-args: |
54
+ BASE_TAG=${{ github.ref_name }}-base-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}
55
+ CUDA=${{ matrix.cuda }}
56
+ PYTORCH_VERSION=${{ matrix.pytorch }}
57
+ AXOLOTL_ARGS=${{ matrix.axolotl_args }}
58
+ file: ./docker/Dockerfile
59
+ push: ${{ github.event_name != 'pull_request' }}
60
+ tags: |
61
+ ${{ steps.metadata.outputs.tags }}-${{ format('{0:yyyyMMdd}', github.event.repository.pushed_at) }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
62
+ labels: ${{ steps.metadata.outputs.labels }}
63
+
64
+ build-axolotl-cloud:
65
+ needs: build-axolotl
66
+ if: ${{ ! contains(github.event.commits[0].message, '[skip docker]]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
67
+ # this job needs to be run on self-hosted GPU runners...
68
+ strategy:
69
+ matrix:
70
+ include:
71
+ - cuda: 118
72
+ cuda_version: 11.8.0
73
+ python_version: "3.10"
74
+ pytorch: 2.1.2
75
+ axolotl_extras:
76
+ is_latest: true
77
+ - cuda: 121
78
+ cuda_version: 12.1.0
79
+ python_version: "3.10"
80
+ pytorch: 2.1.2
81
+ axolotl_extras:
82
+ - cuda: 121
83
+ cuda_version: 12.1.0
84
+ python_version: "3.11"
85
+ pytorch: 2.2.1
86
+ axolotl_extras:
87
+ runs-on: axolotl-gpu-runner
88
+ steps:
89
+ - name: Checkout
90
+ uses: actions/checkout@v4
91
+ - name: Docker metadata
92
+ id: metadata
93
+ uses: docker/metadata-action@v5
94
+ with:
95
+ images: winglian/axolotl-cloud
96
+ - name: Login to Docker Hub
97
+ uses: docker/login-action@v3
98
+ with:
99
+ username: ${{ secrets.DOCKERHUB_USERNAME }}
100
+ password: ${{ secrets.DOCKERHUB_TOKEN }}
101
+ - name: Set up Docker Buildx
102
+ uses: docker/setup-buildx-action@v2
103
+ - name: Build
104
+ uses: docker/build-push-action@v5
105
+ with:
106
+ context: .
107
+ build-args: |
108
+ BASE_TAG=${{ github.ref_name }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
109
+ CUDA=${{ matrix.cuda }}
110
+ file: ./docker/Dockerfile-cloud
111
+ push: ${{ github.event_name != 'pull_request' }}
112
+ tags: |
113
+ ${{ steps.metadata.outputs.tags }}-${{ format('{0:yyyyMMdd}', github.event.repository.pushed_at) }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
114
+ labels: ${{ steps.metadata.outputs.labels }}
.github/workflows/tests.yml CHANGED
@@ -79,6 +79,11 @@ jobs:
79
  python_version: "3.10"
80
  pytorch: 2.1.2
81
  num_gpus: 1
 
 
 
 
 
82
  steps:
83
  - name: Checkout
84
  uses: actions/checkout@v4
 
79
  python_version: "3.10"
80
  pytorch: 2.1.2
81
  num_gpus: 1
82
+ - cuda: 121
83
+ cuda_version: 12.1.0
84
+ python_version: "3.11"
85
+ pytorch: 2.2.1
86
+ num_gpus: 1
87
  steps:
88
  - name: Checkout
89
  uses: actions/checkout@v4