Dockerfile 3.0 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768
  1. FROM nvidia/cuda:11.8.0-devel-ubuntu22.04 as builder
  2. RUN apt-get update && \
  3. apt-get install --no-install-recommends -y git vim build-essential python3-dev python3-venv && \
  4. rm -rf /var/lib/apt/lists/*
  5. RUN git clone https://github.com/oobabooga/GPTQ-for-LLaMa /build
  6. WORKDIR /build
  7. RUN python3 -m venv /build/venv
  8. RUN . /build/venv/bin/activate && \
  9. pip3 install --upgrade pip setuptools && \
  10. pip3 install torch torchvision torchaudio && \
  11. pip3 install -r requirements.txt
  12. # https://developer.nvidia.com/cuda-gpus
  13. # for a rtx 2060: ARG TORCH_CUDA_ARCH_LIST="7.5"
  14. ARG TORCH_CUDA_ARCH_LIST="3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX"
  15. RUN . /build/venv/bin/activate && \
  16. python3 setup_cuda.py bdist_wheel -d .
  17. FROM nvidia/cuda:11.8.0-runtime-ubuntu22.04
  18. LABEL maintainer="Your Name <your.email@example.com>"
  19. LABEL description="Docker image for GPTQ-for-LLaMa and Text Generation WebUI"
  20. RUN apt-get update && \
  21. apt-get install --no-install-recommends -y git python3 python3-pip && \
  22. rm -rf /var/lib/apt/lists/*
  23. RUN --mount=type=cache,target=/root/.cache/pip pip3 install virtualenv
  24. RUN mkdir /app
  25. WORKDIR /app
  26. ARG WEBUI_VERSION
  27. RUN test -n "${WEBUI_VERSION}" && git reset --hard ${WEBUI_VERSION} || echo "Using provided webui source"
  28. RUN virtualenv /app/venv
  29. RUN . /app/venv/bin/activate && \
  30. pip3 install --upgrade pip setuptools && \
  31. pip3 install torch torchvision torchaudio
  32. COPY --from=builder /build /app/repositories/GPTQ-for-LLaMa
  33. RUN . /app/venv/bin/activate && \
  34. pip3 install /app/repositories/GPTQ-for-LLaMa/*.whl
  35. COPY extensions/api/requirements.txt /app/extensions/api/requirements.txt
  36. COPY extensions/elevenlabs_tts/requirements.txt /app/extensions/elevenlabs_tts/requirements.txt
  37. COPY extensions/google_translate/requirements.txt /app/extensions/google_translate/requirements.txt
  38. COPY extensions/silero_tts/requirements.txt /app/extensions/silero_tts/requirements.txt
  39. COPY extensions/whisper_stt/requirements.txt /app/extensions/whisper_stt/requirements.txt
  40. RUN --mount=type=cache,target=/root/.cache/pip . /app/venv/bin/activate && cd extensions/api && pip3 install -r requirements.txt
  41. RUN --mount=type=cache,target=/root/.cache/pip . /app/venv/bin/activate && cd extensions/elevenlabs_tts && pip3 install -r requirements.txt
  42. RUN --mount=type=cache,target=/root/.cache/pip . /app/venv/bin/activate && cd extensions/google_translate && pip3 install -r requirements.txt
  43. RUN --mount=type=cache,target=/root/.cache/pip . /app/venv/bin/activate && cd extensions/silero_tts && pip3 install -r requirements.txt
  44. RUN --mount=type=cache,target=/root/.cache/pip . /app/venv/bin/activate && cd extensions/whisper_stt && pip3 install -r requirements.txt
  45. COPY requirements.txt /app/requirements.txt
  46. RUN . /app/venv/bin/activate && \
  47. pip3 install -r requirements.txt
  48. RUN cp /app/venv/lib/python3.10/site-packages/bitsandbytes/libbitsandbytes_cuda118.so /app/venv/lib/python3.10/site-packages/bitsandbytes/libbitsandbytes_cpu.so
  49. COPY . /app/
  50. ENV CLI_ARGS=""
  51. CMD . /app/venv/bin/activate && python3 server.py ${CLI_ARGS}