|
|
|
@ -5,9 +5,6 @@ ARG CUDA_V11_ARCHITECTURES="50;52;53;60;61;62;70;72;75;80;86" |
|
|
|
ARG CUDA_VERSION_12=12.4.0 |
|
|
|
ARG CUDA_V12_ARCHITECTURES="60;61;62;70;72;75;80;86;87;89;90;90a" |
|
|
|
ARG ROCM_VERSION=6.1.2 |
|
|
|
ARG JETPACK_6=r36.2.0 |
|
|
|
ARG JETPACK_5=r35.4.1 |
|
|
|
ARG JETPACK_4=r32.7.1 |
|
|
|
|
|
|
|
# Copy the minimal context we need to run the generate scripts |
|
|
|
FROM scratch AS llm-code |
|
|
|
@ -84,39 +81,6 @@ RUN --mount=type=cache,target=/root/.ccache \ |
|
|
|
OLLAMA_CUSTOM_CUDA_DEFS="-DGGML_CUDA_USE_GRAPHS=on" \ |
|
|
|
bash gen_linux.sh |
|
|
|
|
|
|
|
FROM --platform=linux/arm64 nvcr.io/nvidia/l4t-jetpack:${JETPACK_6} AS cuda-build-jetpack6-arm64 |
|
|
|
ARG CMAKE_VERSION |
|
|
|
RUN apt-get update && apt-get install -y git curl && \ |
|
|
|
curl -s -L https://github.com/Kitware/CMake/releases/download/v${CMAKE_VERSION}/cmake-${CMAKE_VERSION}-linux-$(uname -m).tar.gz | tar -zx -C /usr --strip-components 1 |
|
|
|
COPY --from=llm-code / /go/src/github.com/ollama/ollama/ |
|
|
|
WORKDIR /go/src/github.com/ollama/ollama/llm/generate |
|
|
|
ARG CGO_CFLAGS |
|
|
|
ENV GOARCH arm64 |
|
|
|
ENV LIBRARY_PATH /usr/local/cuda/lib64/stubs |
|
|
|
RUN --mount=type=cache,target=/root/.ccache \ |
|
|
|
OLLAMA_SKIP_STATIC_GENERATE=1 \ |
|
|
|
OLLAMA_SKIP_CPU_GENERATE=1 \ |
|
|
|
CUDA_VARIANT="_jetpack6" \ |
|
|
|
CUDA_DIST_DIR="/go/src/github.com/ollama/ollama/dist/linux-arm64/ollama_libs/cuda_jetpack6" \ |
|
|
|
CMAKE_CUDA_ARCHITECTURES="87" \ |
|
|
|
bash gen_linux.sh |
|
|
|
|
|
|
|
FROM --platform=linux/arm64 nvcr.io/nvidia/l4t-jetpack:${JETPACK_5} AS cuda-build-jetpack5-arm64 |
|
|
|
ARG CMAKE_VERSION |
|
|
|
RUN apt-get update && apt-get install -y git curl && \ |
|
|
|
curl -s -L https://github.com/Kitware/CMake/releases/download/v${CMAKE_VERSION}/cmake-${CMAKE_VERSION}-linux-$(uname -m).tar.gz | tar -zx -C /usr --strip-components 1 |
|
|
|
COPY --from=llm-code / /go/src/github.com/ollama/ollama/ |
|
|
|
WORKDIR /go/src/github.com/ollama/ollama/llm/generate |
|
|
|
ARG CGO_CFLAGS |
|
|
|
ENV GOARCH arm64 |
|
|
|
ENV LIBRARY_PATH /usr/local/cuda/lib64/stubs |
|
|
|
RUN --mount=type=cache,target=/root/.ccache \ |
|
|
|
OLLAMA_SKIP_STATIC_GENERATE=1 \ |
|
|
|
OLLAMA_SKIP_CPU_GENERATE=1 \ |
|
|
|
CUDA_VARIANT="_jetpack5" \ |
|
|
|
CUDA_DIST_DIR="/go/src/github.com/ollama/ollama/dist/linux-arm64/ollama_libs/cuda_jetpack5" \ |
|
|
|
CMAKE_CUDA_ARCHITECTURES="72;87" \ |
|
|
|
bash gen_linux.sh |
|
|
|
|
|
|
|
FROM --platform=linux/amd64 rocm/dev-centos-7:${ROCM_VERSION}-complete AS rocm-build-amd64 |
|
|
|
ARG CMAKE_VERSION |
|
|
|
@ -209,12 +173,6 @@ COPY --from=cuda-11-build-server-arm64 /go/src/github.com/ollama/ollama/dist/ di |
|
|
|
COPY --from=cuda-11-build-server-arm64 /go/src/github.com/ollama/ollama/llm/build/linux/ llm/build/linux/ |
|
|
|
COPY --from=cuda-12-build-server-arm64 /go/src/github.com/ollama/ollama/dist/ dist/ |
|
|
|
COPY --from=cuda-12-build-server-arm64 /go/src/github.com/ollama/ollama/llm/build/linux/ llm/build/linux/ |
|
|
|
## arm binary += 381M |
|
|
|
COPY --from=cuda-build-jetpack6-arm64 /go/src/github.com/ollama/ollama/llm/build/linux/ llm/build/linux/ |
|
|
|
COPY --from=cuda-build-jetpack6-arm64 /go/src/github.com/ollama/ollama/dist/ dist/ |
|
|
|
## arm binary += 330M |
|
|
|
COPY --from=cuda-build-jetpack5-arm64 /go/src/github.com/ollama/ollama/llm/build/linux/ llm/build/linux/ |
|
|
|
COPY --from=cuda-build-jetpack5-arm64 /go/src/github.com/ollama/ollama/dist/ dist/ |
|
|
|
ARG GOFLAGS |
|
|
|
ARG CGO_CFLAGS |
|
|
|
RUN --mount=type=cache,target=/root/.ccache \ |
|
|
|
|