winglian commited on
Commit
cf62cfd
·
unverified ·
1 Parent(s): c5df969

add runpod envs to .bashrc, fix bnb env (#316)

Browse files

* hopper support for base dockerfile, add runpod envs to .bashrc

* set BNB_CUDA_VERSION env for latest bnb

* don't support hopper yet w 118

.github/workflows/main.yml CHANGED
@@ -69,22 +69,22 @@ jobs:
69
  strategy:
70
  matrix:
71
  include:
72
- - cuda: cu118
73
  cuda_version: 11.8.0
74
  python_version: "3.9"
75
  pytorch: 2.0.1
76
  axolotl_extras:
77
- - cuda: cu118
78
  cuda_version: 11.8.0
79
  python_version: "3.10"
80
  pytorch: 2.0.1
81
  axolotl_extras:
82
- - cuda: cu118
83
  cuda_version: 11.8.0
84
  python_version: "3.9"
85
  pytorch: 2.0.1
86
  axolotl_extras: gptq
87
- - cuda: cu117
88
  cuda_version: 11.7.1
89
  python_version: "3.9"
90
  pytorch: 1.13.1
@@ -110,8 +110,9 @@ jobs:
110
  with:
111
  context: .
112
  build-args: |
113
- BASE_TAG=${{ github.ref_name }}-py${{ matrix.python_version }}-${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
 
114
  file: ./docker/Dockerfile-runpod
115
  push: ${{ github.event_name != 'pull_request' }}
116
- tags: ${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
117
  labels: ${{ steps.metadata.outputs.labels }}
 
69
  strategy:
70
  matrix:
71
  include:
72
+ - cuda: 118
73
  cuda_version: 11.8.0
74
  python_version: "3.9"
75
  pytorch: 2.0.1
76
  axolotl_extras:
77
+ - cuda: 118
78
  cuda_version: 11.8.0
79
  python_version: "3.10"
80
  pytorch: 2.0.1
81
  axolotl_extras:
82
+ - cuda: 118
83
  cuda_version: 11.8.0
84
  python_version: "3.9"
85
  pytorch: 2.0.1
86
  axolotl_extras: gptq
87
+ - cuda: 117
88
  cuda_version: 11.7.1
89
  python_version: "3.9"
90
  pytorch: 1.13.1
 
110
  with:
111
  context: .
112
  build-args: |
113
+ BASE_TAG=${{ github.ref_name }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
114
+ CUDA=${{ matrix.cuda }}
115
  file: ./docker/Dockerfile-runpod
116
  push: ${{ github.event_name != 'pull_request' }}
117
+ tags: ${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
118
  labels: ${{ steps.metadata.outputs.labels }}
docker/Dockerfile CHANGED
@@ -3,6 +3,8 @@ FROM winglian/axolotl-base:$BASE_TAG
3
 
4
  ARG TORCH_CUDA_ARCH_LIST="7.0 7.5 8.0 8.6+PTX"
5
  ARG AXOLOTL_EXTRAS=""
 
 
6
 
7
  RUN apt-get update && \
8
  apt-get install -y vim curl
 
3
 
4
  ARG TORCH_CUDA_ARCH_LIST="7.0 7.5 8.0 8.6+PTX"
5
  ARG AXOLOTL_EXTRAS=""
6
+ ARG CUDA="118"
7
+ ENV BNB_CUDA_VERSION=$CUDA
8
 
9
  RUN apt-get update && \
10
  apt-get install -y vim curl
scripts/runpod-entrypoint.sh CHANGED
@@ -1,10 +1,21 @@
1
  #!/bin/bash
2
 
3
- echo $PUBLIC_KEY >> ~/.ssh/authorized_keys
4
- chmod 700 -R ~/.ssh
 
 
5
 
6
- # Start the SSH service in the background
7
- service ssh start
 
 
 
 
 
 
 
 
 
8
 
9
  # Execute the passed arguments (CMD)
10
  exec "$@"
 
1
  #!/bin/bash
2
 
3
+ # Export specific ENV variables to /etc/rp_environment
4
+ echo "Exporting environment variables..."
5
+ printenv | grep -E '^RUNPOD_|^PATH=|^_=' | sed 's/^\(.*\)=\(.*\)$/export \1="\2"/' >> /etc/rp_environment
6
+ echo 'source /etc/rp_environment' >> ~/.bashrc
7
 
8
+ if [[ $PUBLIC_KEY ]]
9
+ then
10
+ mkdir -p ~/.ssh
11
+ chmod 700 ~/.ssh
12
+ echo $PUBLIC_KEY >> ~/.ssh/authorized_keys
13
+ chmod 700 -R ~/.ssh
14
+ # Start the SSH service in the background
15
+ service ssh start
16
+ else
17
+ echo "No PUBLIC_KEY ENV variable provided, not starting openSSH daemon"
18
+ fi
19
 
20
  # Execute the passed arguments (CMD)
21
  exec "$@"