add runpod envs to .bashrc, fix bnb env (#316)
Browse files
* hopper support for base dockerfile, add runpod envs to .bashrc
* set BNB_CUDA_VERSION env for latest bnb
* don't support hopper yet w 118
- .github/workflows/main.yml +7 -6
- docker/Dockerfile +2 -0
- scripts/runpod-entrypoint.sh +15 -4
.github/workflows/main.yml
CHANGED
@@ -69,22 +69,22 @@ jobs:
|
|
69 |
strategy:
|
70 |
matrix:
|
71 |
include:
|
72 |
-
- cuda:
|
73 |
cuda_version: 11.8.0
|
74 |
python_version: "3.9"
|
75 |
pytorch: 2.0.1
|
76 |
axolotl_extras:
|
77 |
-
- cuda:
|
78 |
cuda_version: 11.8.0
|
79 |
python_version: "3.10"
|
80 |
pytorch: 2.0.1
|
81 |
axolotl_extras:
|
82 |
-
- cuda:
|
83 |
cuda_version: 11.8.0
|
84 |
python_version: "3.9"
|
85 |
pytorch: 2.0.1
|
86 |
axolotl_extras: gptq
|
87 |
-
- cuda:
|
88 |
cuda_version: 11.7.1
|
89 |
python_version: "3.9"
|
90 |
pytorch: 1.13.1
|
@@ -110,8 +110,9 @@ jobs:
|
|
110 |
with:
|
111 |
context: .
|
112 |
build-args: |
|
113 |
-
BASE_TAG=${{ github.ref_name }}-py${{ matrix.python_version }}
|
|
|
114 |
file: ./docker/Dockerfile-runpod
|
115 |
push: ${{ github.event_name != 'pull_request' }}
|
116 |
-
tags: ${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}
|
117 |
labels: ${{ steps.metadata.outputs.labels }}
|
|
|
69 |
strategy:
|
70 |
matrix:
|
71 |
include:
|
72 |
+
- cuda: 118
|
73 |
cuda_version: 11.8.0
|
74 |
python_version: "3.9"
|
75 |
pytorch: 2.0.1
|
76 |
axolotl_extras:
|
77 |
+
- cuda: 118
|
78 |
cuda_version: 11.8.0
|
79 |
python_version: "3.10"
|
80 |
pytorch: 2.0.1
|
81 |
axolotl_extras:
|
82 |
+
- cuda: 118
|
83 |
cuda_version: 11.8.0
|
84 |
python_version: "3.9"
|
85 |
pytorch: 2.0.1
|
86 |
axolotl_extras: gptq
|
87 |
+
- cuda: 117
|
88 |
cuda_version: 11.7.1
|
89 |
python_version: "3.9"
|
90 |
pytorch: 1.13.1
|
|
|
110 |
with:
|
111 |
context: .
|
112 |
build-args: |
|
113 |
+
BASE_TAG=${{ github.ref_name }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
114 |
+
CUDA=${{ matrix.cuda }}
|
115 |
file: ./docker/Dockerfile-runpod
|
116 |
push: ${{ github.event_name != 'pull_request' }}
|
117 |
+
tags: ${{ steps.metadata.outputs.tags }}-py${{ matrix.python_version }}-cu${{ matrix.cuda }}-${{ matrix.pytorch }}${{ matrix.axolotl_extras != '' && '-' || '' }}${{ matrix.axolotl_extras }}
|
118 |
labels: ${{ steps.metadata.outputs.labels }}
|
docker/Dockerfile
CHANGED
@@ -3,6 +3,8 @@ FROM winglian/axolotl-base:$BASE_TAG
|
|
3 |
|
4 |
ARG TORCH_CUDA_ARCH_LIST="7.0 7.5 8.0 8.6+PTX"
|
5 |
ARG AXOLOTL_EXTRAS=""
|
|
|
|
|
6 |
|
7 |
RUN apt-get update && \
|
8 |
apt-get install -y vim curl
|
|
|
3 |
|
4 |
ARG TORCH_CUDA_ARCH_LIST="7.0 7.5 8.0 8.6+PTX"
|
5 |
ARG AXOLOTL_EXTRAS=""
|
6 |
+
ARG CUDA="118"
|
7 |
+
ENV BNB_CUDA_VERSION=$CUDA
|
8 |
|
9 |
RUN apt-get update && \
|
10 |
apt-get install -y vim curl
|
scripts/runpod-entrypoint.sh
CHANGED
@@ -1,10 +1,21 @@
|
|
1 |
#!/bin/bash
|
2 |
|
3 |
-
|
4 |
-
|
|
|
|
|
5 |
|
6 |
-
|
7 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8 |
|
9 |
# Execute the passed arguments (CMD)
|
10 |
exec "$@"
|
|
|
1 |
#!/bin/bash
|
2 |
|
3 |
+
# Export specific ENV variables to /etc/rp_environment
|
4 |
+
echo "Exporting environment variables..."
|
5 |
+
# Persist RUNPOD_*, PATH and _ as `export NAME="value"` lines for later login shells.
# The first sed pass escapes \ " $ and ` so a sourced value is reproduced verbatim;
# the second splits on the FIRST '=' so values that themselves contain '=' stay intact.
printenv | grep -E '^RUNPOD_|^PATH=|^_=' | sed -e 's/[\\"$`]/\\&/g' -e 's/^\([^=]*\)=\(.*\)$/export \1="\2"/' >> /etc/rp_environment
|
6 |
+
# Add the hook only once: the entrypoint runs on every container start, and a
# plain append would stack duplicate `source` lines in ~/.bashrc.
grep -qxF 'source /etc/rp_environment' ~/.bashrc 2>/dev/null || echo 'source /etc/rp_environment' >> ~/.bashrc
|
7 |
|
8 |
+
if [[ $PUBLIC_KEY ]]
|
9 |
+
then
|
10 |
+
mkdir -p ~/.ssh
|
11 |
+
chmod 700 ~/.ssh
|
12 |
+
# Quote the expansion so the key text is written exactly as provided
# (no word splitting, no glob expansion, embedded newlines preserved).
printf '%s\n' "$PUBLIC_KEY" >> ~/.ssh/authorized_keys
|
13 |
+
chmod 700 -R ~/.ssh
|
14 |
+
# Start the SSH service in the background
|
15 |
+
service ssh start
|
16 |
+
else
|
17 |
+
echo "No PUBLIC_KEY ENV variable provided, not starting openSSH daemon"
|
18 |
+
fi
|
19 |
|
20 |
# Execute the passed arguments (CMD)
|
21 |
exec "$@"
|