# Base image. Pinned to an explicit release rather than the moving `latest`
# tag so that rebuilding this file later yields the same OS and package set.
# NOTE(review): 24.04 is the release `latest` is believed to resolve to at
# review time; change the tag deliberately if another release is required.
FROM ubuntu:24.04

# Install the C/C++ toolchain, CMake, and Python with pip. The later
# `pip install` step sets FORCE_CMAKE=1, so a compiler and CMake must be present.
#
# - `&&` (not `;`) so a failed `apt-get update` aborts the build instead of
#   letting the install run against missing or stale package indexes.
# - DEBIAN_FRONTEND is set inline so it applies to this command only and is
#   not baked into the runtime environment.
# - The apt package lists are removed in the same layer; deleting them in a
#   later layer would not shrink the image.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
        build-essential \
        cmake \
        python3 \
        python3-pip \
    && rm -rf /var/lib/apt/lists/*

# Working directory for the remaining build instructions and for the process
# started by CMD. Docker creates the directory if it does not already exist.
WORKDIR /usr/src/app

# Build and install llama-cpp-python with its `server` extra.
#
# - CMAKE_ARGS / FORCE_CMAKE are passed through the environment to the
#   package's build, exactly as before.
#   NOTE(review): `-DLLAMA_METAL=on` requests the Apple Metal backend, which
#   is presumably unavailable inside a Linux (Ubuntu) image; confirm whether
#   this flag should be dropped or replaced with a Linux-appropriate backend.
# - PIP_BREAK_SYSTEM_PACKAGES=1: recent Ubuntu releases mark the system Python
#   as externally managed (PEP 668), so pip refuses system-wide installs
#   unless this is set. It is acceptable here because the image exists only
#   to run this one application. Older pip is believed to ignore the variable.
# - --no-cache-dir keeps pip's download/build cache out of the image layer.
# - The requirement is quoted so the shell never treats `[server]` as a glob.
# NOTE(review): the package version is not pinned; consider pinning it for
# reproducible builds.
RUN CMAKE_ARGS="-DLLAMA_METAL=on" FORCE_CMAKE=1 PIP_BREAK_SYSTEM_PACKAGES=1 \
    python3 -m pip install --no-cache-dir "llama-cpp-python[server]"

# Default process: the llama_cpp HTTP server module.
# Exec (JSON-array) form runs python3 directly as PID 1 instead of under
# `/bin/sh -c`, so it receives SIGTERM from `docker stop` and can shut down
# cleanly.
CMD ["python3", "-m", "llama_cpp.server"]