# Dockerfile.cpu
  # This Aphrodite Dockerfile constructs an image that can build and run
  # Aphrodite on the x86 CPU platform.
  FROM ubuntu:22.04 AS cpu-test-1

  # System packages: GCC/G++ 12 toolchain, Python 3 with pip, NUMA and tcmalloc
  # libraries, general utilities, and the ffmpeg/X11/GL runtime libraries.
  # - Both installs run in one apt transaction with the package list sorted for
  #   easier diffing.
  # - DEBIAN_FRONTEND is set inline so it does not leak into the runtime env.
  # - The apt package index is deleted in the same layer that downloaded it, so
  #   it never persists in the image.
  # - update-alternatives registers gcc-12 as `gcc`, with g++-12 following it
  #   as the `g++` slave link.
  RUN apt-get update -y \
      && DEBIAN_FRONTEND=noninteractive apt-get install -y \
          curl \
          ffmpeg \
          g++-12 \
          gcc-12 \
          git \
          libgl1 \
          libnuma-dev \
          libsm6 \
          libtcmalloc-minimal4 \
          libxext6 \
          numactl \
          python3 \
          python3-pip \
          vim \
          wget \
      && rm -rf /var/lib/apt/lists/* \
      && update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-12 10 --slave /usr/bin/g++ g++ /usr/bin/g++-12

  # https://intel.github.io/intel-extension-for-pytorch/cpu/latest/tutorials/performance_tuning/tuning_guide.html
  # intel-openmp provides an additional performance improvement over the default OpenMP runtime.
  # tcmalloc provides better memory allocation efficiency, e.g. by holding memory
  # in caches to speed up access to commonly used objects.
  # --no-cache-dir keeps pip's download cache out of the image layer.
  RUN pip install --no-cache-dir intel-openmp

  # Preload tcmalloc and the Intel OpenMP runtime into every process.
  # NOTE(review): /usr/local/lib/libiomp5.so is presumably where the
  # intel-openmp wheel places its library -- confirm after bumping versions.
  ENV LD_PRELOAD="/usr/lib/x86_64-linux-gnu/libtcmalloc_minimal.so.4:/usr/local/lib/libiomp5.so"

  # Disable core dumps in bash sessions that source ~/.bashrc.
  RUN echo 'ulimit -c 0' >> ~/.bashrc

  # Intel Extension for PyTorch, pinned to a specific CPython 3.10 / x86_64 wheel.
  RUN pip install --no-cache-dir https://intel-extension-for-pytorch.s3.amazonaws.com/ipex_dev/cpu/intel_extension_for_pytorch-2.4.0%2Bgitfbaa4bc-cp310-cp310-linux_x86_64.whl

  # Upgrade pip itself, then install the Python-side build tooling.
  RUN pip install --no-cache-dir --upgrade pip \
      && pip install --no-cache-dir wheel packaging ninja "setuptools>=49.4.0" numpy
  # Build stage: installs Aphrodite from the build context on top of the
  # cpu-test-1 base stage and defines the container entrypoint.
  FROM cpu-test-1 AS build

  # NOTE(review): the whole build context is copied before the requirements are
  # installed, so any source change re-runs the dependency install below.
  # Copying only the requirements files first would improve caching, but the
  # set of files requirements-cpu.txt pulls in is not visible here -- confirm
  # before reordering.
  COPY ./ /workspace/aphrodite-engine
  WORKDIR /workspace/aphrodite-engine

  # CPU requirements; the extra index serves the CPU-only PyTorch wheels.
  # --no-cache-dir keeps pip's download cache out of the image layer.
  RUN pip install --no-cache-dir -v -r requirements-cpu.txt --extra-index-url https://download.pytorch.org/whl/cpu

  # Support for building with non-AVX512 Aphrodite: docker build --build-arg APHRODITE_CPU_DISABLE_AVX512="true" ...
  # The build argument is re-exported as an environment variable, so it is
  # visible to the setup.py step below and also persists into the running
  # container. When the build argument is not supplied the variable is set to
  # an empty string.
  ARG APHRODITE_CPU_DISABLE_AVX512
  ENV APHRODITE_CPU_DISABLE_AVX512=${APHRODITE_CPU_DISABLE_AVX512}

  # Build and install Aphrodite with the CPU target selected.
  RUN APHRODITE_TARGET_DEVICE=cpu python3 setup.py install

  RUN pip install --no-cache-dir triton

  WORKDIR /workspace/

  # Create /workspace/examples and /workspace/benchmarks as symlinks into the
  # source tree (ln names each link after the basename of its target).
  # NOTE(review): ln -s does not check that the target exists -- confirm that
  # tests/benchmarks is the intended path inside the repository.
  RUN ln -s /workspace/aphrodite-engine/examples && ln -s /workspace/aphrodite-engine/tests/benchmarks

  # Exec-form entrypoint: arguments given to `docker run` are appended to it.
  ENTRYPOINT ["python3", "-m", "aphrodite.endpoints.openai.api_server"]