Files
Open-Assistant/docker/inference/Dockerfile.worker-full
T
2023-02-10 22:53:40 +01:00

23 lines
623 B
Docker

# Base image is overridable at build time so that a specific tag or digest can
# be pinned without editing this file, e.g.
#   docker build --build-arg BASE_IMAGE=ghcr.io/huggingface/text-generation-inference:<tag> ...
# The default carries no tag, which Docker resolves to `latest`.
ARG BASE_IMAGE="ghcr.io/huggingface/text-generation-inference"
FROM ${BASE_IMAGE}

# Location of the service sources, relative to the build context.
# With the defaults below this resolves to "inference/worker".
ARG MODULE="inference"
ARG SERVICE="worker"
ARG APP_RELATIVE_PATH="${MODULE}/${SERVICE}"

# Relative destinations in later instructions resolve against this directory.
WORKDIR /worker
# Shared package sources, installed into the worker environment below.
COPY ./oasst-shared /tmp/oasst-shared

# Dedicated Python 3.10 conda environment for the worker. conda's package and
# index caches are removed in the same layer that creates them; deleting them
# in a later layer would not make the image any smaller.
RUN conda create -n worker python=3.10 -y \
    && conda clean --all --yes

# pip is called through the environment's absolute path, so no `conda activate`
# is needed. --no-cache-dir keeps pip's download/wheel cache out of the layer.
RUN /opt/miniconda/envs/worker/bin/pip install --no-cache-dir /tmp/oasst-shared

# requirements.txt is copied separately from the application sources so this
# install layer is only rebuilt when the requirements themselves change.
COPY ./${APP_RELATIVE_PATH}/requirements.txt .
RUN /opt/miniconda/envs/worker/bin/pip install --no-cache-dir -r requirements.txt
# Application code: every top-level *.py file of the service is placed in the
# current working directory.
COPY ./${APP_RELATIVE_PATH}/*.py ./

# Startup script. COPY keeps the file mode from the build context, and the
# exec-form ENTRYPOINT below runs the file directly, so the script has to be
# executable in the repository.
COPY ./${APP_RELATIVE_PATH}/worker_full_main.sh /entrypoint.sh

# Runtime defaults; override with `docker run -e NAME=value`.
# NOTE(review): INFERENCE_SERVER_URL presumably points at an inference server
# running inside this same container - confirm against worker_full_main.sh.
ENV MODEL_ID="distilgpt2" \
    INFERENCE_SERVER_URL="http://localhost:80"

ENTRYPOINT ["/entrypoint.sh"]