Skip to content

Commit dd0752f

Browse files
authored
Merge pull request #1 from nomyx-io/ovai
Ovai
2 parents d485a08 + 61c40c2 commit dd0752f

File tree

126 files changed

+5462
-2704
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

126 files changed

+5462
-2704
lines changed

.github/workflows/base.yml

Lines changed: 13 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -16,17 +16,27 @@ jobs:
1616
cuda_version: 11.8.0
1717
python_version: "3.10"
1818
pytorch: 2.1.2
19-
torch_cuda_arch_list: "7.0 7.5 8.0 8.6 9.0+PTX"
19+
torch_cuda_arch_list: "7.0 7.5 8.0 8.6 8.7 8.9 9.0+PTX"
2020
- cuda: "121"
2121
cuda_version: 12.1.0
2222
python_version: "3.10"
2323
pytorch: 2.1.2
24-
torch_cuda_arch_list: "7.0 7.5 8.0 8.6 9.0+PTX"
24+
torch_cuda_arch_list: "7.0 7.5 8.0 8.6 8.7 8.9 9.0+PTX"
2525
- cuda: "121"
2626
cuda_version: 12.1.0
2727
python_version: "3.11"
2828
pytorch: 2.1.2
29-
torch_cuda_arch_list: "7.0 7.5 8.0 8.6 9.0+PTX"
29+
torch_cuda_arch_list: "7.0 7.5 8.0 8.6 8.7 8.9 9.0+PTX"
30+
- cuda: "121"
31+
cuda_version: 12.1.0
32+
python_version: "3.11"
33+
pytorch: 2.2.1
34+
torch_cuda_arch_list: "7.0 7.5 8.0 8.6 8.7 8.9 9.0+PTX"
35+
- cuda: "121"
36+
cuda_version: 12.1.0
37+
python_version: "3.11"
38+
pytorch: 2.3.0
39+
torch_cuda_arch_list: "7.0 7.5 8.0 8.6 8.7 8.9 9.0+PTX"
3040
steps:
3141
- name: Checkout
3242
uses: actions/checkout@v3

.github/workflows/docs.yml

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,31 @@
1+
name: Publish Docs
2+
on:
3+
push:
4+
branches:
5+
- main
6+
7+
permissions:
8+
contents: write
9+
pages: write
10+
11+
jobs:
12+
build-deploy:
13+
runs-on: ubuntu-latest
14+
steps:
15+
- name: Check out repository
16+
uses: actions/checkout@v4
17+
- name: Set up Quarto
18+
uses: quarto-dev/quarto-actions/setup@v2
19+
- name: Setup Python
20+
uses: actions/setup-python@v3
21+
with:
22+
python-version: '3.10'
23+
- name: install dependencies
24+
run: |
25+
python3 -m pip install jupyter
26+
- name: Publish to GitHub Pages (and render)
27+
uses: quarto-dev/quarto-actions/publish@v2
28+
with:
29+
target: gh-pages
30+
env:
31+
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}

.github/workflows/lint.yml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@ on:
77
- 'requirements.txt'
88
- '.github/workflows/*.yml'
99
- "*.md"
10+
- "examples/**/*.y[a]?ml"
1011
workflow_dispatch:
1112

1213
jobs:

.github/workflows/main.yml

Lines changed: 13 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,12 @@ jobs:
2828
- cuda: 121
2929
cuda_version: 12.1.0
3030
python_version: "3.11"
31-
pytorch: 2.1.2
31+
pytorch: 2.2.1
32+
axolotl_extras:
33+
- cuda: 121
34+
cuda_version: 12.1.0
35+
python_version: "3.11"
36+
pytorch: 2.3.0
3237
axolotl_extras:
3338
runs-on: axolotl-gpu-runner
3439
steps:
@@ -63,7 +68,7 @@ jobs:
6368
${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
6469
labels: ${{ steps.metadata.outputs.labels }}
6570

66-
build-axolotl-runpod:
71+
build-axolotl-cloud:
6772
needs: build-axolotl
6873
if: ${{ ! contains(github.event.commits[0].message, '[skip docker]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
6974
# this job needs to be run on self-hosted GPU runners...
@@ -84,7 +89,12 @@ jobs:
8489
- cuda: 121
8590
cuda_version: 12.1.0
8691
python_version: "3.11"
87-
pytorch: 2.1.2
92+
pytorch: 2.2.1
93+
axolotl_extras:
94+
- cuda: 121
95+
cuda_version: 12.1.0
96+
python_version: "3.11"
97+
pytorch: 2.3.0
8898
axolotl_extras:
8999
runs-on: axolotl-gpu-runner
90100
steps:
@@ -113,7 +123,5 @@ jobs:
113123
push: ${{ github.event_name != 'pull_request' }}
114124
tags: |
115125
${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
116-
winglian/axolotl-runpod:main-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
117126
${{ (matrix.is_latest) && format('{0}-latest', steps.metadata.outputs.tags) || '' }}
118-
${{ (matrix.is_latest) && format('{0}-latest', 'winglian/axolotl-runpod:main') || '' }}
119127
labels: ${{ steps.metadata.outputs.labels }}

.github/workflows/nightlies.yml

Lines changed: 128 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,128 @@
1+
name: docker-nightlies
2+
3+
on:
4+
workflow_dispatch:
5+
schedule:
6+
- cron: '0 0 * * *' # Runs at 00:00 UTC every day
7+
8+
jobs:
9+
build-axolotl:
10+
if: ${{ ! contains(github.event.commits[0].message, '[skip docker]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
11+
strategy:
12+
fail-fast: false
13+
matrix:
14+
include:
15+
- cuda: 118
16+
cuda_version: 11.8.0
17+
python_version: "3.10"
18+
pytorch: 2.1.2
19+
axolotl_extras:
20+
axolotl_args: "--extra-index-url https://download.pytorch.org/whl/cu118"
21+
is_latest: true
22+
- cuda: 121
23+
cuda_version: 12.1.0
24+
python_version: "3.10"
25+
pytorch: 2.1.2
26+
axolotl_extras:
27+
- cuda: 121
28+
cuda_version: 12.1.0
29+
python_version: "3.11"
30+
pytorch: 2.2.1
31+
axolotl_extras:
32+
- cuda: 121
33+
cuda_version: 12.1.0
34+
python_version: "3.11"
35+
pytorch: 2.3.0
36+
axolotl_extras:
37+
runs-on: axolotl-gpu-runner
38+
steps:
39+
- name: Checkout
40+
uses: actions/checkout@v4
41+
- name: Docker metadata
42+
id: metadata
43+
uses: docker/metadata-action@v5
44+
with:
45+
images: winglian/axolotl
46+
tags: |
47+
type=raw,value={{ branch }}-{{ date 'YYYYMMDD' }}
48+
- name: Set up Docker Buildx
49+
uses: docker/setup-buildx-action@v3
50+
- name: Login to Docker Hub
51+
uses: docker/login-action@v3
52+
with:
53+
username: ${{ secrets.DOCKERHUB_USERNAME }}
54+
password: ${{ secrets.DOCKERHUB_TOKEN }}
55+
# guidance for testing before pushing: https://docs.docker.com/build/ci/github-actions/test-before-push/
56+
- name: Build and export to Docker
57+
uses: docker/build-push-action@v5
58+
with:
59+
context: .
60+
build-args: |
61+
BASE_TAG=${{ github.ref_name }}-base-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}
62+
CUDA=${{ matrix.cuda }}
63+
PYTORCH_VERSION=${{ matrix.pytorch }}
64+
AXOLOTL_ARGS=${{ matrix.axolotl_args }}
65+
file: ./docker/Dockerfile
66+
push: ${{ github.event_name != 'pull_request' }}
67+
tags: |
68+
${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
69+
labels: ${{ steps.metadata.outputs.labels }}
70+
71+
build-axolotl-cloud:
72+
needs: build-axolotl
73+
if: ${{ ! contains(github.event.commits[0].message, '[skip docker]') && github.repository_owner == 'OpenAccess-AI-Collective' }}
74+
# this job needs to be run on self-hosted GPU runners...
75+
strategy:
76+
matrix:
77+
include:
78+
- cuda: 118
79+
cuda_version: 11.8.0
80+
python_version: "3.10"
81+
pytorch: 2.1.2
82+
axolotl_extras:
83+
is_latest: true
84+
- cuda: 121
85+
cuda_version: 12.1.0
86+
python_version: "3.10"
87+
pytorch: 2.1.2
88+
axolotl_extras:
89+
- cuda: 121
90+
cuda_version: 12.1.0
91+
python_version: "3.11"
92+
pytorch: 2.2.1
93+
axolotl_extras:
94+
- cuda: 121
95+
cuda_version: 12.1.0
96+
python_version: "3.11"
97+
pytorch: 2.3.0
98+
axolotl_extras:
99+
runs-on: axolotl-gpu-runner
100+
steps:
101+
- name: Checkout
102+
uses: actions/checkout@v4
103+
- name: Docker metadata
104+
id: metadata
105+
uses: docker/metadata-action@v5
106+
with:
107+
images: winglian/axolotl-cloud
108+
tags: |
109+
type=raw,value={{ branch }}-{{ date 'YYYYMMDD' }}
110+
- name: Login to Docker Hub
111+
uses: docker/login-action@v3
112+
with:
113+
username: ${{ secrets.DOCKERHUB_USERNAME }}
114+
password: ${{ secrets.DOCKERHUB_TOKEN }}
115+
- name: Set up Docker Buildx
116+
uses: docker/setup-buildx-action@v2
117+
- name: Build
118+
uses: docker/build-push-action@v5
119+
with:
120+
context: .
121+
build-args: |
122+
BASE_TAG=${{ github.ref_name }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
123+
CUDA=${{ matrix.cuda }}
124+
file: ./docker/Dockerfile-cloud
125+
push: ${{ github.event_name != 'pull_request' }}
126+
tags: |
127+
${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
128+
labels: ${{ steps.metadata.outputs.labels }}

.github/workflows/pypi.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@ jobs:
2525

2626
- name: Install dependencies
2727
run: |
28-
pip3 install wheel
28+
pip3 install wheel packaging
2929
pip3 install -e .
3030
pip3 install -r requirements-tests.txt
3131

.github/workflows/tests.yml

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -34,7 +34,7 @@ jobs:
3434
fail-fast: false
3535
matrix:
3636
python_version: ["3.10", "3.11"]
37-
timeout-minutes: 10
37+
timeout-minutes: 20
3838

3939
steps:
4040
- name: Check out repository code
@@ -48,6 +48,8 @@ jobs:
4848

4949
- name: Install dependencies
5050
run: |
51+
pip3 install --upgrade pip
52+
pip3 install --upgrade packaging
5153
pip3 install -U -e .
5254
pip3 install -r requirements-tests.txt
5355
@@ -77,6 +79,11 @@ jobs:
7779
python_version: "3.10"
7880
pytorch: 2.1.2
7981
num_gpus: 1
82+
- cuda: 121
83+
cuda_version: 12.1.0
84+
python_version: "3.11"
85+
pytorch: 2.2.1
86+
num_gpus: 1
8087
steps:
8188
- name: Checkout
8289
uses: actions/checkout@v4

.gitignore

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,9 @@
22
configs
33
last_run_prepared/
44
.vscode
5+
data/
6+
outputs/
7+
_site/
58

69
# Byte-compiled / optimized / DLL files
710
__pycache__/
@@ -132,6 +135,7 @@ venv/
132135
ENV/
133136
env.bak/
134137
venv.bak/
138+
venv3.10/
135139

136140
# Spyder project settings
137141
.spyderproject
@@ -172,3 +176,5 @@ wandb
172176
lora-out/*
173177
qlora-out/*
174178
mlruns/*
179+
180+
/.quarto/

0 commit comments

Comments
 (0)