matrix-pygmalion-bot/runpod/runpod-worker-transformers/Dockerfile

# Base images for the two build stages; both can be overridden with --build-arg.
#   DEV_IMAGE  - CUDA "devel" image used by the builder stage below.
#   BASE_IMAGE - CUDA "runtime" image used by the final stage.
ARG DEV_IMAGE=nvidia/cuda:11.8.0-cudnn8-devel-ubuntu22.04
ARG BASE_IMAGE=nvidia/cuda:11.8.0-cudnn8-runtime-ubuntu22.04
# Alternative base images that were tried earlier (kept for reference):
#ARG BASE_IMAGE=nvidia/cuda:11.6.2-cudnn8-devel-ubuntu20.04
#ARG BASE_IMAGE=runpod/pytorch:3.10-2.0.0-117
#ARG BASE_IMAGE=nvcr.io/nvidia/pytorch:23.03-py3

# ---- Builder stage ----
# The keyword is written as uppercase AS to match the casing of FROM.
FROM ${DEV_IMAGE} AS builder

# Name of the model to fetch; supplied with --build-arg MODEL_NAME=... and
# re-exported as an environment variable for the RUN steps of this stage.
ARG MODEL_NAME
ENV MODEL_NAME=${MODEL_NAME}

WORKDIR /
# Run every following RUN step of this stage through bash with pipefail enabled.
SHELL ["/bin/bash", "-o", "pipefail", "-c"]
# The key=value form is required here. With the legacy `ENV key value` form,
# everything after the first space (including the continued `SHELL=/bin/bash`)
# becomes the value of DEBIAN_FRONTEND, and SHELL is never set.
ENV DEBIAN_FRONTEND=noninteractive \
    SHELL=/bin/bash

# Install the build toolchain and general utilities for the builder stage.
# - `apt-get upgrade` is run to patch known vulnerabilities in apt packages, as
#   the Ubuntu base image is sometimes rebuilt too seldom (less than once a month).
# - `apt-get` is used instead of `apt`, whose command-line interface is not
#   meant for scripts.
# - libgl1 used to be in this list and is deliberately left out.
# - The apt caches are removed in the same layer that created them.
# - The last command writes the en_US.UTF-8 entry to /etc/locale.gen;
#   locale-gen itself is not run here.
RUN apt-get update --yes && \
    apt-get upgrade --yes && \
    apt-get install --yes --no-install-recommends \
      bash \
      build-essential \
      ca-certificates \
      cmake \
      curl \
      git \
      git-lfs \
      openssh-server \
      software-properties-common \
      wget && \
    apt-get clean && rm -rf /var/lib/apt/lists/* && \
    echo "en_US.UTF-8 UTF-8" > /etc/locale.gen

#RUN apt-key del 7fa2af80 && \
#    apt-key adv --fetch-keys https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2004/x86_64/3bf863cc.pub
#
#RUN add-apt-repository ppa:deadsnakes/ppa && \
#    apt-get install python3.10 python3.10-dev python3.10-venv python3-pip -y --no-install-recommends && \
#    update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.10 1 && \
#    update-alternatives --install /usr/bin/python python /usr/bin/python3 1 && \
##    update-alternatives --install /usr/bin/pip pip /usr/bin/pip3 1 && \
#    update-alternatives --set python3 /usr/bin/python3.10 && \
#    update-alternatives --set python /usr/bin/python3 && \
#    apt-get clean && rm -rf /var/lib/apt/lists/*

# Install the distribution's Python 3 interpreter, headers, venv support and pip.
# `apt-get` is used instead of `apt`, whose command-line interface is not meant
# for scripts; the apt caches are removed in the same layer.
RUN apt-get update --yes && \
    apt-get install --yes --no-install-recommends \
      python3 \
      python3-dev \
      python3-pip \
      python3-venv && \
    apt-get clean && rm -rf /var/lib/apt/lists/*

# CUDA compute capabilities to target when PyTorch CUDA extensions are compiled
# (TORCH_CUDA_ARCH_LIST is read by PyTorch's extension build tooling).
ENV TORCH_CUDA_ARCH_LIST="3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX"

# Python dependencies of the builder stage. Each package is installed by its
# own pip invocation, in this order; the pip cache is purged at the end so it
# does not stay in the layer.
# torch/torchvision/torchaudio additionally consult the cu118 wheel index.
# transformers is installed from the tip of its git repository.
RUN pip3 install --upgrade pip \
 && pip3 install cuda-python==11.8.0 \
 && pip3 install --default-timeout=100 torch torchvision torchaudio --extra-index-url=https://download.pytorch.org/whl/cu118 \
 && pip3 install bitsandbytes \
 && pip3 install safetensors \
 && pip3 install sentencepiece \
 && pip3 install diffusers \
 && pip3 install accelerate xformers triton \
 && pip3 install git+https://github.com/huggingface/transformers.git \
 && pip3 install huggingface-hub \
 && pip3 install runpod \
 && pip3 cache purge

# WORKDIR creates /workspace when it does not exist, so no separate
# `RUN mkdir -p /workspace` layer is needed.
WORKDIR /workspace

# Alternatives that were tried earlier and are kept for reference:
#   - pin GPTQ-for-LLaMa to a fixed commit after cloning:
#       (cd repositories/GPTQ-for-LLaMa && git reset --hard 437154dd434c3f9d5c9c4e6f401d6d71116ac248)
#   - build from a different fork:
#       git clone --depth 1 https://github.com/AlpinDale/gptq-gptj.git repositories/GPTQ-for-LLaMa
#
# Clone the `cuda` branch of GPTQ-for-LLaMa into ./repositories and run its
# setup_cuda.py install step from inside the checkout.
# NOTE(review): the final stage only copies /workspace/repositories from this
# stage - confirm that whatever setup_cuda.py installs outside that directory
# is not needed at runtime.
RUN mkdir repositories \
 && git clone --branch cuda --single-branch \
      https://github.com/qwopqwop200/GPTQ-for-LLaMa.git \
      repositories/GPTQ-for-LLaMa \
 && cd repositories/GPTQ-for-LLaMa \
 && python3 setup_cuda.py install

# Copy the fetch script into the image and run it for the requested model at
# build time. The variable is quoted so that a model name containing
# whitespace or glob characters reaches the script as a single argument.
COPY model_fetcher.py /workspace/
RUN python3 model_fetcher.py --model_name="${MODEL_NAME}"


# ---- Final (runtime) stage ----
# Starts again from the CUDA runtime base image. ENV and SHELL settings of the
# builder stage do not carry over, so they are declared again where needed.
FROM ${BASE_IMAGE} AS runtime
# Model name given at build time; kept in the image environment so the
# container command can read it.
ARG MODEL_NAME
ENV MODEL_NAME=${MODEL_NAME}
ENV TORCH_CUDA_ARCH_LIST="3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX"
# WORKDIR creates /workspace when it does not exist, so no separate
# `RUN mkdir -p /workspace` layer is needed.
WORKDIR /workspace

# Install Python 3 (interpreter, headers, venv, pip) and git in the final image.
# - DEBIAN_FRONTEND is set only for this RUN step so package configuration
#   cannot stop the build waiting for input; this stage does not inherit the
#   builder's ENV.
# - `apt-get` is used instead of `apt`, whose command-line interface is not
#   meant for scripts.
# - The apt caches are removed in the same layer that created them.
RUN export DEBIAN_FRONTEND=noninteractive && \
    apt-get update --yes && \
    apt-get install --yes --no-install-recommends \
      git \
      python3 \
      python3-dev \
      python3-pip \
      python3-venv && \
    apt-get clean && rm -rf /var/lib/apt/lists/*

# Python dependencies of the final image. Each package is installed by its own
# pip invocation, in this order; the pip cache is purged at the end so it does
# not stay in the layer.
# torch/torchvision/torchaudio additionally consult the cu118 wheel index.
# transformers is installed from the tip of its git repository.
# Unlike the builder stage, this list also installs `rwkv`.
RUN pip3 install --upgrade pip \
 && pip3 install cuda-python==11.8.0 \
 && pip3 install --default-timeout=100 torch torchvision torchaudio --extra-index-url=https://download.pytorch.org/whl/cu118 \
 && pip3 install bitsandbytes \
 && pip3 install safetensors \
 && pip3 install sentencepiece \
 && pip3 install diffusers \
 && pip3 install accelerate xformers triton \
 && pip3 install git+https://github.com/huggingface/transformers.git \
 && pip3 install rwkv \
 && pip3 install huggingface-hub \
 && pip3 install runpod \
 && pip3 cache purge

# Make sure both target directories exist, then bring over what the builder
# stage produced: the cloned repositories and the Hugging Face cache directory
# under /root/.cache/huggingface.
RUN mkdir -p /workspace/repositories /root/.cache/huggingface
COPY --from=builder /workspace/repositories /workspace/repositories/
COPY --from=builder /root/.cache/huggingface /root/.cache/huggingface

#RUN git lfs install && \
#    git clone --depth 1 https://huggingface.co/${MODEL_NAME}

# Application files from the build context, all placed in /workspace/.
COPY model_fetcher.py runpod_infer.py RWKV.py test_input.json /workspace/

# Container command: run runpod_infer.py with unbuffered output (-u) for the
# model named in MODEL_NAME.
# Exec (JSON) form is used with an explicit shell so ${MODEL_NAME} is still
# expanded when the container starts. `exec` replaces that shell with python,
# so python runs as PID 1 and receives the stop signal directly.
CMD ["/bin/sh", "-c", "exec python3 -u runpod_infer.py --model_name=\"${MODEL_NAME}\""]
more tests on remote worker container 2 years ago			`ARG DEV_IMAGE=nvidia/cuda:11.8.0-cudnn8-devel-ubuntu22.04`
rewrite remote transformers container 2 years ago			`ARG BASE_IMAGE=nvidia/cuda:11.8.0-cudnn8-runtime-ubuntu22.04`
test 2 years ago			`#ARG BASE_IMAGE=nvidia/cuda:11.6.2-cudnn8-devel-ubuntu20.04`
rewrite remote transformers container 2 years ago			`#ARG BASE_IMAGE=runpod/pytorch:3.10-2.0.0-117`
test 2 years ago			`#ARG BASE_IMAGE=nvcr.io/nvidia/pytorch:23.03-py3`
more tests on remote worker container 2 years ago			`FROM ${DEV_IMAGE} as builder`
work on remote workers 2 years ago
chatbot remote worker test 2 years ago			`ARG MODEL_NAME`
			`ENV MODEL_NAME=${MODEL_NAME}`

add experimental and wip worker containers 2 years ago			`WORKDIR /`
work on remote workers 2 years ago			`SHELL ["/bin/bash", "-o", "pipefail", "-c"]`
			`ENV DEBIAN_FRONTEND noninteractive\`
			`SHELL=/bin/bash`
add experimental and wip worker containers 2 years ago
work on remote workers 2 years ago			`RUN apt-get update --yes && \`
add experimental and wip worker containers 2 years ago			`# - apt-get upgrade is run to patch known vulnerabilities in apt-get packages as`
			`# the ubuntu base image is rebuilt too seldom sometimes (less than once a month)`
more tests on remote worker container 2 years ago			`apt-get upgrade --yes && \`
add experimental and wip worker containers 2 years ago			`apt install --yes --no-install-recommends \`
more tests on remote worker container 2 years ago			`build-essential \`
			`cmake \`
test 2 years ago			`ca-certificates \`
			`git \`
			`git-lfs \`
			`wget \`
			`curl \`
			`bash \`
more tests on remote worker container 2 years ago			`# libgl1 \`
test 2 years ago			`software-properties-common \`
			`openssh-server && \`
			`apt-get clean && rm -rf /var/lib/apt/lists/* && \`
			`echo "en_US.UTF-8 UTF-8" > /etc/locale.gen`

			`#RUN apt-key del 7fa2af80 && \`
			`# apt-key adv --fetch-keys https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2004/x86_64/3bf863cc.pub`
			`#`
			`#RUN add-apt-repository ppa:deadsnakes/ppa && \`
			`# apt-get install python3.10 python3.10-dev python3.10-venv python3-pip -y --no-install-recommends && \`
			`# update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.10 1 && \`
			`# update-alternatives --install /usr/bin/python python /usr/bin/python3 1 && \`
			`## update-alternatives --install /usr/bin/pip pip /usr/bin/pip3 1 && \`
			`# update-alternatives --set python3 /usr/bin/python3.10 && \`
			`# update-alternatives --set python /usr/bin/python3 && \`
			`# apt-get clean && rm -rf /var/lib/apt/lists/*`

			`RUN apt-get update --yes && \`
			`apt install --yes --no-install-recommends \`
			`python3 python3-dev python3-venv python3-pip && \`
add experimental and wip worker containers 2 years ago			`apt-get clean && rm -rf /var/lib/apt/lists/*`
work on remote workers 2 years ago
remote worker 2 years ago			`ENV TORCH_CUDA_ARCH_LIST="3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX"`
test 2 years ago			`RUN pip3 install --upgrade pip && \`
remote worker 2 years ago			`pip3 install cuda-python==11.8.0 && \`
			`pip3 install --default-timeout=100 torch torchvision torchaudio --extra-index-url=https://download.pytorch.org/whl/cu118 && \`
test 2 years ago			`pip3 install bitsandbytes && \`
			`pip3 install safetensors && \`
more tests on the remote workers 2 years ago			`pip3 install sentencepiece && \`
test 2 years ago			`pip3 install diffusers && \`
prepare RWKV 2 years ago			`pip3 install accelerate xformers triton && \`
			`pip3 install git+https://github.com/huggingface/transformers.git && \`
test 2 years ago			`pip3 install huggingface-hub && \`
rewrite remote transformers container 2 years ago			`pip3 install runpod && \`
			`pip3 cache purge`
work on remote workers 2 years ago
test 2 years ago			`RUN mkdir -p /workspace`
add experimental and wip worker containers 2 years ago			`WORKDIR /workspace`
work on remote workers 2 years ago
more tests on remote worker container 2 years ago			`RUN mkdir repositories && git clone --branch cuda --single-branch https://github.com/qwopqwop200/GPTQ-for-LLaMa.git repositories/GPTQ-for-LLaMa && \`
try other quantized model 2 years ago			`# (cd repositories/GPTQ-for-LLaMa && git reset --hard 437154dd434c3f9d5c9c4e6f401d6d71116ac248) && \`
more tests on remote worker container 2 years ago			`#RUN mkdir repositories && git clone --depth 1 https://github.com/AlpinDale/gptq-gptj.git repositories/GPTQ-for-LLaMa && \`
			`(cd repositories/GPTQ-for-LLaMa && python3 setup_cuda.py install)`

add experimental and wip worker containers 2 years ago			`COPY model_fetcher.py /workspace/`
chatbot remote worker test 2 years ago			`RUN python3 model_fetcher.py --model_name=${MODEL_NAME}`
more tests on remote worker container 2 years ago

			`FROM ${BASE_IMAGE}`
remote worker 2 years ago			`ARG MODEL_NAME`
			`ENV MODEL_NAME=${MODEL_NAME}`
			`ENV TORCH_CUDA_ARCH_LIST="3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX"`
more tests on remote worker container 2 years ago			`RUN mkdir -p /workspace`
			`WORKDIR /workspace`

			`RUN apt-get update --yes && \`
			`apt install --yes --no-install-recommends \`
update dependencies 2 years ago			`python3 python3-dev python3-venv python3-pip \`
			`git && \`
more tests on remote worker container 2 years ago			`apt-get clean && rm -rf /var/lib/apt/lists/*`

			`RUN pip3 install --upgrade pip && \`
remote worker 2 years ago			`pip3 install cuda-python==11.8.0 && \`
			`pip3 install --default-timeout=100 torch torchvision torchaudio --extra-index-url=https://download.pytorch.org/whl/cu118 && \`
more tests on remote worker container 2 years ago			`pip3 install bitsandbytes && \`
			`pip3 install safetensors && \`
more tests on the remote workers 2 years ago			`pip3 install sentencepiece && \`
more tests on remote worker container 2 years ago			`pip3 install diffusers && \`
prepare RWKV 2 years ago			`pip3 install accelerate xformers triton && \`
			`pip3 install git+https://github.com/huggingface/transformers.git && \`
			`pip3 install rwkv && \`
more tests on remote worker container 2 years ago			`pip3 install huggingface-hub && \`
			`pip3 install runpod && \`
			`pip3 cache purge`

more tests on the remote workers 2 years ago			`RUN mkdir -p /workspace/repositories && mkdir -p /root/.cache/huggingface`
more tests on remote worker container 2 years ago			`COPY --from=builder /workspace/repositories /workspace/repositories/`
			`COPY --from=builder /root/.cache/huggingface /root/.cache/huggingface`

add experimental and wip worker containers 2 years ago			`#RUN git lfs install && \`
			`# git clone --depth 1 https://huggingface.co/${MODEL_NAME}`
work on remote workers 2 years ago
more tests on remote worker container 2 years ago			`COPY model_fetcher.py /workspace/`
add experimental and wip worker containers 2 years ago			`COPY runpod_infer.py /workspace/`
prepare RWKV 2 years ago			`COPY RWKV.py /workspace/`
add experimental and wip worker containers 2 years ago			`COPY test_input.json /workspace/`
work on remote workers 2 years ago
chatbot remote worker test 2 years ago			`CMD python3 -u runpod_infer.py --model_name=${MODEL_NAME}`