-
Notifications
You must be signed in to change notification settings - Fork 39
Expand file tree
/
Copy pathcuda.Dockerfile
More file actions
51 lines (46 loc) · 2.52 KB
/
cuda.Dockerfile
File metadata and controls
51 lines (46 loc) · 2.52 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
#--- dockerfile to test hugot ---
ARG GO_VERSION=1.26.0
ARG ONNXRUNTIME_VERSION=1.24.2
ARG ONNXRUNTIME_GENAI_VERSION=0.12.0
ARG GOPJRT_VERSION=0.83.4
ARG JAX_CUDA_VERSION=0.8.1
ARG BUILD_PLATFORM=linux/amd64
#--- runtime layer with all hugot dependencies for cpu and gpu ---
FROM --platform=$BUILD_PLATFORM public.ecr.aws/amazonlinux/amazonlinux:2023 AS hugot-runtime
ARG GO_VERSION
ARG ONNXRUNTIME_VERSION
ARG ONNXRUNTIME_GENAI_VERSION
ARG GOPJRT_VERSION
ARG JAX_CUDA_VERSION
ENV PATH="$PATH:/usr/local/go/bin" \
GOPJRT_NOSUDO=1
COPY ./scripts/download-onnxruntime.sh /download-onnxruntime.sh
COPY ./scripts/download-onnxruntime-genai.sh /download-onnxruntime-genai.sh
COPY ./scripts/download-tokenizers.sh /download-tokenizers.sh
RUN --mount=src=./go.mod,dst=/go.mod \
dnf --allowerasing -y install gcc jq bash tar xz gzip glibc-static libstdc++ wget zip git dirmngr sudo which && \
ln -s /usr/lib64/libstdc++.so.6 /usr/lib64/libstdc++.so && \
dnf install -y 'dnf-command(config-manager)' && \
# from rhel
dnf config-manager --add-repo https://developer.download.nvidia.com/compute/cuda/repos/rhel9/x86_64/cuda-rhel9.repo && \
dnf install -y cuda-cudart-12-9 cuda-nvrtc-12-9 libcublas-12-9 libcurand-12-9 libcufft-12-9 libcudnn9-cuda-12 && \
dnf clean all && \
# go
curl -LO https://golang.org/dl/go${GO_VERSION}.linux-amd64.tar.gz && \
tar -C /usr/local -xzf go${GO_VERSION}.linux-amd64.tar.gz && \
rm go${GO_VERSION}.linux-amd64.tar.gz && \
# tokenizers
sed -i 's/\r//g' /download-tokenizers.sh && chmod +x /download-tokenizers.sh && \
./download-tokenizers.sh && \
# onnxruntime cpu and gpu
sed -i 's/\r//g' /download-onnxruntime.sh && chmod +x /download-onnxruntime.sh && \
/download-onnxruntime.sh --onnxruntime-version=${ONNXRUNTIME_VERSION} --cuda && \
sed -i 's/\r//g' /download-onnxruntime-genai.sh && chmod +x /download-onnxruntime-genai.sh && \
/download-onnxruntime-genai.sh --onnxruntime-genai-version=${ONNXRUNTIME_GENAI_VERSION} --cuda && \
# XLA/goMLX
GOPROXY=direct go run github.com/gomlx/go-xla/cmd/pjrt_installer@latest -plugin=linux -version=v${GOPJRT_VERSION} -path=/usr/local/lib/go-xla && \
GOPROXY=direct go run github.com/gomlx/go-xla/cmd/pjrt_installer@latest -plugin=cuda13 -version=${JAX_CUDA_VERSION} -path=/usr/local/lib/go-xla && \
# NON-PRIVILEGED USER
# create non-privileged testuser with id: 1000
useradd -u 1000 -m testuser && usermod -a -G wheel testuser && \
echo "testuser ALL=(ALL) NOPASSWD: ALL" >> /etc/sudoers.d/testuser