-
Notifications
You must be signed in to change notification settings - Fork 20
/
Copy pathcuda.Dockerfile
45 lines (40 loc) · 2.27 KB
/
cuda.Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
# --- Dockerfile used to test hugot ---
# Global build arguments. They are declared ahead of the first FROM, so a stage
# has to re-declare any of them (without a value) before it can read it.
#   BUILD_PLATFORM       platform passed to `FROM --platform=...`
#   ONNXRUNTIME_VERSION  onnxruntime release to download
#   GO_VERSION           Go toolchain release to download
ARG BUILD_PLATFORM=linux/amd64
ARG ONNXRUNTIME_VERSION=1.20.0
ARG GO_VERSION=1.23.3
#--- runtime layer with all hugot dependencies for cpu and gpu ---
FROM --platform=$BUILD_PLATFORM public.ecr.aws/amazonlinux/amazonlinux:2023 AS hugot-runtime
# Re-declare the global build args so their values are visible inside this stage.
ARG GO_VERSION
ARG ONNXRUNTIME_VERSION
# Put the Go toolchain (unpacked into /usr/local/go below) on PATH.
# NOTE(review): GOPJRT_NOSUDO is presumably read by the gopjrt install scripts
# fetched below - confirm against those scripts.
ENV PATH="$PATH:/usr/local/go/bin" \
    GOPJRT_NOSUDO=1
# Run RUN steps under bash with pipefail: without it, a failed `curl` in
# `curl ... | bash` or a failed `grep` in `grep ... | awk` is masked by the exit
# status of the last command in the pipe and the build continues silently.
SHELL ["/bin/bash", "-o", "pipefail", "-c"]
COPY ./scripts/download-onnxruntime-gpu.sh /download-onnxruntime-gpu.sh
# Single layer that installs, in order: OS packages, the NVIDIA CUDA 12.6 runtime
# libraries, libtokenizers (version read from the bind-mounted go.mod),
# onnxruntime, the gopjrt/XLA libraries, the Go toolchain, and finally a
# non-privileged `testuser` with passwordless sudo.
# go.mod is bind-mounted rather than copied, so it is not stored in the layer.
RUN --mount=src=./go.mod,dst=/go.mod \
    dnf --allowerasing -y install gcc jq bash tar xz gzip glibc-static libstdc++ wget zip git dirmngr sudo which && \
    ln -s /usr/lib64/libstdc++.so.6 /usr/lib64/libstdc++.so && \
    dnf install -y 'dnf-command(config-manager)' && \
    # CUDA packages come from NVIDIA's rhel9 repository
    dnf config-manager --add-repo https://developer.download.nvidia.com/compute/cuda/repos/rhel9/x86_64/cuda-rhel9.repo && \
    dnf install -y cuda-cudart-12-6 cuda-nvrtc-12-6 libcublas-12-6 libcurand-12-6 libcufft-12-6 libcudnn9-cuda-12 && \
    dnf clean all && \
    # tokenizers: take the version from go.mod, keeping only the text after the last '-'
    tokenizer_version=$(grep 'github.com/daulet/tokenizers' /go.mod | awk '{print $2}') && \
    tokenizer_version=$(echo "$tokenizer_version" | awk -F'-' '{print $NF}') && \
    echo "tokenizer_version: $tokenizer_version" && \
    # -f makes curl exit non-zero on an HTTP error instead of saving the error page
    curl -fLO "https://github.com/daulet/tokenizers/releases/download/${tokenizer_version}/libtokenizers.linux-amd64.tar.gz" && \
    tar -C /usr/lib -xzf libtokenizers.linux-amd64.tar.gz && \
    rm libtokenizers.linux-amd64.tar.gz && \
    # onnxruntime cpu and gpu (strip CR characters from the script before running it)
    sed -i 's/\r//g' /download-onnxruntime-gpu.sh && chmod +x /download-onnxruntime-gpu.sh && \
    /download-onnxruntime-gpu.sh "${ONNXRUNTIME_VERSION}" && \
    # XLA/goMLX
    # NOTE(review): these installers are fetched from the `main` branch and piped
    # straight into bash - consider pinning to a tag or commit and verifying a checksum.
    curl -sSf https://raw.githubusercontent.com/gomlx/gopjrt/main/cmd/install_linux_amd64_amazonlinux.sh | bash && \
    curl -sSf https://raw.githubusercontent.com/gomlx/gopjrt/main/cmd/install_cuda.sh | bash && \
    # go
    curl -fLO "https://golang.org/dl/go${GO_VERSION}.linux-amd64.tar.gz" && \
    tar -C /usr/local -xzf "go${GO_VERSION}.linux-amd64.tar.gz" && \
    rm "go${GO_VERSION}.linux-amd64.tar.gz" && \
    # NON-PRIVILEGED USER
    # create non-privileged testuser with id: 1000
    useradd -u 1000 -m testuser && usermod -a -G wheel testuser && \
    echo "testuser ALL=(ALL) NOPASSWD: ALL" >> /etc/sudoers.d/testuser