
support VLLM_MODEL override
yoziru committed May 7, 2024
1 parent 79277ac · commit 586e708
Showing 2 changed files with 28 additions and 12 deletions.
README.md (7 changes: 5 additions & 2 deletions)
````diff
@@ -19,8 +19,6 @@ This project aims to be the easiest way for you to get started with LLMs. No ted
 - **Easy setup:** No tedious and annoying setup required. Just clone the repo and you're good to go!
 - **Code syntax highlighting:** Messages that include code will be highlighted for easy access.
 - **Copy codeblocks easily:** Easily copy the highlighted code with one click.
-- **Download/Pull & Delete models:** Easily download and delete models directly from the interface.
-- **Switch between models:** Switch between models fast with a click.
 - **Chat history:** Chats are saved and easily accessed.
 - **Light & Dark mode:** Switch between light & dark mode.
@@ -43,6 +41,11 @@ The easiest way to get started is to use the pre-built Docker image.
 docker run --rm -d -p 3000:3000 -e VLLM_URL=http://host.docker.internal:8000 ghcr.io/yoziru/nextjs-vllm-ui:latest
 ```
 
+If you're using Ollama, you need to set the `VLLM_MODEL` environment variable:
+```
+docker run --rm -d -p 3000:3000 -e VLLM_URL=http://host.docker.internal:11434 -e NEXT_PUBLIC_TOKEN_LIMIT=8192 -e VLLM_MODEL=llama3 ghcr.io/yoziru/nextjs-vllm-ui:latest
+```
+
 Then go to [localhost:3000](http://localhost:3000) and start chatting with your favourite model!
 
 # Development 📖
````
(rest of the file unchanged)
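Once the container is running, a quick way to confirm the override took effect is to query the UI's `/api/models` route, whose handler is changed in this commit (see the diff below). A minimal TypeScript sketch, assuming the app is reachable at `localhost:3000` and was started with `-e VLLM_MODEL=llama3`:

```ts
// Sketch: verify that the VLLM_MODEL override is being served.
// When VLLM_MODEL is set, the route answers straight from the
// environment variable and never contacts the vLLM/Ollama backend.
const res = await fetch("http://localhost:3000/api/models");
console.log(await res.json());
// expected: { object: "list", data: [{ id: "llama3" }] }
```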
src/app/api/models/route.ts (33 changes: 23 additions & 10 deletions)
```diff
@@ -1,17 +1,30 @@
 import { NextRequest, NextResponse } from "next/server";
 
 export async function GET(req: NextRequest): Promise<NextResponse> {
-  const baseUrl = process.env.VLLM_URL;
-  const apiKey = process.env.VLLM_API_KEY;
-  const headers = new Headers();
-  if (apiKey !== undefined) {
-    headers.set("Authorization", `Bearer ${apiKey}`);
-    headers.set("api-key", apiKey);
-  }
-  if (!baseUrl) {
-    throw new Error("VLLM_URL is not set");
-  }
+
+  const envModel = process.env.VLLM_MODEL;
+  if (envModel) {
+    return NextResponse.json({
+      object: "list",
+      data: [
+        {
+          id: envModel,
+        },
+      ],
+    });
+  }
+
   try {
+    const baseUrl = process.env.VLLM_URL;
+    if (!baseUrl) {
+      throw new Error("VLLM_URL is not set");
+    }
+    const apiKey = process.env.VLLM_API_KEY;
+    const headers = new Headers();
+    if (apiKey !== undefined) {
+      headers.set("Authorization", `Bearer ${apiKey}`);
+      headers.set("api-key", apiKey);
+    }
     const res = await fetch(`${baseUrl}/v1/models`, {
       headers: headers,
       cache: "no-store",
```
(diff truncated; the rest of the file is unchanged)
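The new early return means the handler never issues the `fetch` when `VLLM_MODEL` is set, so the backend does not need to be reachable just to populate the model list. A hypothetical test-style sketch of that behaviour (the `@/app/api/models/route` import path is an assumed alias, not part of this commit):

```ts
import { NextRequest } from "next/server";
// Assumed import path; adjust to the project's alias or use a relative path.
import { GET } from "@/app/api/models/route";

// Simulate the container environment from the README example.
process.env.VLLM_MODEL = "llama3";

const res = await GET(new NextRequest("http://localhost:3000/api/models"));
console.log(await res.json());
// -> { object: "list", data: [{ id: "llama3" }] }
```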
