Spaces:

jbilcke-hf
/

webapp-factory-llama-node

Sleeping

jbilcke-hf HF staff committed on Jun 26, 2023

Commit

5535b95

1 Parent(s): 1e042d7

install deps in /tmp

Files changed (2) hide show

Dockerfile CHANGED Viewed

@@ -48,10 +48,12 @@ RUN pnpm --version
 RUN pnpm install
 # ok! let's try to compile llama-node
 RUN git clone https://github.com/Atome-FE/llama-node.git
-WORKDIR $HOME/app/llama-node
 RUN git submodule update --init --recursive
@@ -62,7 +64,7 @@ RUN pnpm build:llama-cpp
 RUN pnpm:build
-WORKDIR $HOME/app/llama-node/packages/llama-cpp
 RUN pnpm build:cuda

 RUN pnpm install
+WORKDIR /tmp
 # ok! let's try to compile llama-node
 RUN git clone https://github.com/Atome-FE/llama-node.git
+WORKDIR /tmp/llama-node
 RUN git submodule update --init --recursive
 RUN pnpm:build
+WORKDIR /tmp/llama-node/packages/llama-cpp
 RUN pnpm build:cuda

src/index.mts CHANGED Viewed

@@ -93,7 +93,7 @@ app.get("/app", async (req, res) => {
   // naive implementation: we say we are out of capacity
   if (pending.queue.length >= maxParallelRequests) {
-    res.write('sorry, max nb of parallel request reached')
     res.end()
     return
   }

   // naive implementation: we say we are out of capacity
   if (pending.queue.length >= maxParallelRequests) {
+    res.write('Sorry, max nb of parallel requests reached. A new slot should be available in < 5 min.')
     res.end()
     return
   }