# Listing metadata from the file viewer: file size 1,716 bytes, revision 6b225ba.
# CUDA 11.8 / cuDNN 8 development image on Ubuntu 20.04.
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu20.04
LABEL maintainer="Hugging Face"
# key=value form; the space-separated `ENV key value` syntax is deprecated.
ENV PYTHONUNBUFFERED=1
# Documents 7860 as the container's service port (EXPOSE does not publish it).
EXPOSE 7860
# Build-time only, so the setting does not leak into the runtime environment.
ARG DEBIAN_FRONTEND=noninteractive
# Use a login shell so that every RUN re-reads `~/.profile`; this is how
# dynamically created variables are passed from one RUN command to the next.
SHELL ["sh", "-lc"]
# Compiler toolchain and curl. `update` and `install` share one layer so a
# cached, stale package index is never reused for a fresh install, and
# `apt-get` is used because `apt` has no stable scripting interface.
# The package lists are intentionally kept: a later step installs more packages.
RUN apt-get update \
    && apt-get --yes install build-essential curl
# Node.js 18 from the NodeSource repository. The setup script is downloaded to
# a file first so that a failed download aborts the build instead of being
# hidden behind a pipe into bash.
RUN curl -fsSL https://deb.nodesource.com/setup_18.x -o /tmp/nodesource_setup.sh \
    && bash /tmp/nodesource_setup.sh \
    && rm -f /tmp/nodesource_setup.sh \
    && apt-get --yes install nodejs
# Install the Rust nightly toolchain with rustup; `-y` skips the interactive prompt.
# `--proto '=https' --tlsv1.2` restricts curl to HTTPS with TLS 1.2 or newer,
# matching rustup's documented install command.
# NOTE(review): `nightly` is a moving target; pin a dated nightly for reproducible builds.
RUN curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- --default-toolchain nightly -y
# Configure pnpm through corepack.
# NOTE(review): the version originally pinned here was lost (the `pnpm@<version>`
# token had been replaced by an email-obfuscation placeholder). 8.6.12 is an
# assumed pnpm 8 release; confirm it, or override with --build-arg PNPM_VERSION=...
ARG PNPM_VERSION=8.6.12
RUN corepack enable
RUN corepack prepare "pnpm@${PNPM_VERSION}" --activate
# Remaining system packages, one per line and sorted for readable diffs.
# The index is refreshed in the same layer as the install so the step never
# depends on a cached `update` layer from earlier in the build, and the lists
# are removed afterwards because no later step installs packages.
RUN apt-get update \
    && apt-get --yes install \
        espeak-ng \
        ffmpeg \
        git \
        git-lfs \
        libsndfile1-dev \
        python3 \
        python3-pip \
        tesseract-ocr \
    && rm -rf /var/lib/apt/lists/*
# Set up the Git LFS hooks/filters for the current (root) account.
RUN git lfs install
RUN python3 -m pip install --no-cache-dir --upgrade pip
# Build llama-node from source in a scratch directory.
WORKDIR /tmp
# NOTE(review): this clones the default branch head; pin a tag or commit for reproducible builds.
RUN git clone https://github.com/Atome-FE/llama-node.git
WORKDIR /tmp/llama-node
RUN git submodule update --init --recursive
# Dependency lifecycle scripts are skipped here; the builds are run explicitly below.
RUN pnpm install --ignore-scripts
# Build the llama-cpp backend first.
RUN pnpm build:llama-cpp
# Previously `RUN pnpm:build`, which the shell parses as a command literally
# named "pnpm:build" and fails with "not found".
# Assumes the repository's root package.json defines a `build` script; confirm.
RUN pnpm build
# CUDA-enabled build of the llama-cpp package.
WORKDIR /tmp/llama-node/packages/llama-cpp
RUN pnpm build:cuda
# Add the llama-node library directory to the dynamic linker search path.
# ENV substitution only sees variables declared with ENV/ARG; HOME is not
# declared at this point, so the previous `$HOME/.llama-node` expanded to
# `/.llama-node`. The preceding build steps run as root, hence /root.
# NOTE(review): presumably the CUDA build writes its libraries to
# /root/.llama-node; confirm, and check that the non-root runtime user can read
# that directory (copy it into the user's home if not).
ENV LD_LIBRARY_PATH=${LD_LIBRARY_PATH}:/root/.llama-node
# Create an unprivileged account (UID 1000) with a home directory, then run
# every following instruction as that account.
RUN useradd --create-home --uid 1000 user
USER user
# Point HOME at the new account and put its per-user bin directory first on PATH.
ENV HOME=/home/user
ENV PATH=/home/user/.local/bin:$PATH
# Application directory inside the user's home.
WORKDIR $HOME/app
# Install the Node app's dependencies before copying the sources, so this layer
# stays cached until a package manifest changes.
# A wildcard can match several files, so the destination is written as a
# directory with a trailing slash.
COPY --chown=user package*.json ./
# Sanity check: pnpm must be runnable by the non-root user.
RUN pnpm --version
# NOTE(review): switch to `npm ci` if a package-lock.json is always committed.
RUN npm install
# Copy the rest of the application sources.
COPY --chown=user . .
# Download the GGML model weights into models/ at build time.
# NOTE(review): the remote file is not integrity-checked; consider
# `ADD --checksum=sha256:<digest>` once the expected digest is known.
ADD --chown=user https://huggingface.co/TheBloke/airoboros-13b-gpt4-GGML/resolve/main/airoboros-13b-gpt4.ggmlv3.q4_0.bin models/airoboros-13b-gpt4.ggmlv3.q4_0.bin
# Run test.py during the build; a non-zero exit status aborts the image build.
RUN python3 test.py
# Exec form. A stray trailing `|` previously made the JSON array invalid, so
# the instruction fell back to shell form and failed to parse.
CMD ["pnpm", "run", "start"]