# Image that runs the llama-cpp-python OpenAI-compatible server module
# (llama_cpp.server) against a model file under /usr/src/app/models.

# Python minor version of the base image. Pinned so rebuilds are reproducible
# instead of following whatever the floating "bullseye" tag points to.
# Override with: docker build --build-arg PYTHON_VERSION=<x.y> .
# NOTE(review): 3.11 is an assumed default; confirm against the version the
# deployment was validated with.
ARG PYTHON_VERSION=3.11
FROM python:${PYTHON_VERSION}-bullseye

# Compiler toolchain for building the llama-cpp-python native extension.
# - "&&" (not ";") so a failed "apt-get update" aborts the build instead of
#   installing from stale or missing package indexes.
# - The apt lists are removed in the same layer so they never reach the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /usr/src/app

# Quoted so the shell can never treat "[server]" as a glob pattern.
# NOTE(review): the package version is unpinned, so each uncached build may
# pull a different release; consider pinning to the release that is known to
# load the model format used below.
RUN pip install --no-cache-dir "llama-cpp-python[server]"

# NOTE(review): no USER instruction is set, so the server runs as root.
# Consider adding a dedicated non-root user once the permissions of the
# models directory are confirmed.

# Exec (JSON-array) form: the server is started directly rather than through
# "/bin/sh -c", so it receives SIGTERM from "docker stop" and shuts down
# promptly.
# The model file is not copied into the image by this Dockerfile; presumably
# it is provided at run time via a volume or bind mount on
# /usr/src/app/models -- TODO confirm.
CMD ["python3", "-m", "llama_cpp.server", "--model", "/usr/src/app/models/gpt4-x-alpaca-13b-native-4bit-128g.bin"]