Add MLC Web-LLM Integration (#5243)
* resolved merge conflicts

* create webllm.ts chat model file

* add prior developed code to webllm.ts with credit

* feat: add webllm entry point

* update @mlc-ai/web-llm dependency

* change @mlc-ai/web-llm dependency to 0.2.28

* change @mlc-ai/web-llm dependency

* Fix imports and spacing

* Updated to use Engine instead of ChatModule (being deprecated)

* Replace chatCompletionAsyncChunkGenerator with more general chat.completions.create

* Add examples and update documentation

* Add integration tests for mlc-llm and @mlc-ai/web-llm

* Make example file for webllm.ts

* Add example code for webllm.ts integration

* Update community package.json and gitignore with WebLLM integration, rework integration example

* chore: format

* remove incorrect comment in webllm.ts

* changed the import statement in test file for mlcllm

* fixed test file to use the right parameters

* changed function to role

* Lint and format

* Comment out test for now

* Fix streaming

* Add docs page, fixes

* Update lock

* Update colors

* Update docstring

---------

Co-authored-by: edwincha <edwincha@DESKTOP-0I6H3O4>
Co-authored-by: echao-2 <[email protected]>
Co-authored-by: Joshua Charat-Collins <[email protected]>
Co-authored-by: Jeffrey Zhang <[email protected]>
Co-authored-by: Joshua Charat-Collins <[email protected]>
Co-authored-by: jacoblee93 <[email protected]>
7 people authored May 13, 2024
1 parent a57d58e commit 5c36137
Showing 10 changed files with 364 additions and 1 deletion.
42 changes: 42 additions & 0 deletions docs/core_docs/docs/integrations/chat/web_llm.mdx
@@ -0,0 +1,42 @@
---
sidebar_class_name: web-only
---

# WebLLM

:::tip Compatibility
Only available in web environments.
:::

You can run LLMs directly in your web browser using LangChain's [WebLLM](https://webllm.mlc.ai) integration.

## Setup

You'll need to install the [WebLLM SDK](https://www.npmjs.com/package/@mlc-ai/web-llm) module to communicate with your local model.

import IntegrationInstallTooltip from "@mdx_components/integration_install_tooltip.mdx";

<IntegrationInstallTooltip></IntegrationInstallTooltip>

```bash npm2yarn
npm install -S @mlc-ai/web-llm @langchain/community
```

## Usage

Note that the first time a model is invoked, WebLLM will download that model's full weights. These can run to multiple gigabytes, and the download may not be feasible for all end-users of your application depending on their internet connection and hardware.
The browser caches the downloaded weights for subsequent loads, but we still recommend using the smallest model that works for your use case.

We also recommend loading and invoking your models in a [separate web worker](https://developer.mozilla.org/en-US/docs/Web/API/Web_Workers_API/Using_web_workers) so that they don't block the main thread.
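
For instance, here is a minimal sketch of wrapping the model in a dedicated worker. The `worker.ts` filename and the message protocol are illustrative assumptions, not part of this integration:

```typescript
// worker.ts -- a minimal sketch; the message protocol is illustrative.
import { ChatWebLLM } from "@langchain/community/chat_models/webllm";

const model = new ChatWebLLM({
  model: "Phi2-q4f32_1",
  chatOptions: { temperature: 0.5 },
});

// Handle prompts posted from the main thread without blocking it.
self.addEventListener("message", async (event: MessageEvent<string>) => {
  const response = await model.invoke(event.data);
  self.postMessage(response.content);
});
```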

import CodeBlock from "@theme/CodeBlock";
import Example from "@examples/models/chat/integration_webllm.ts";

<CodeBlock language="typescript">{Example}</CodeBlock>

Streaming is also supported.
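
As a rough sketch, streaming uses the standard chat model interface (assuming the `model` instance from the example above):

```typescript
// Stream the response chunk by chunk instead of awaiting the full message.
const stream = await model.stream("Why is the sky blue? Answer briefly.");
for await (const chunk of stream) {
  console.log(chunk.content);
}
```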

## Example

For a full end-to-end example, check out [this project](https://github.com/jacoblee93/fully-local-pdf-chatbot).
17 changes: 16 additions & 1 deletion docs/core_docs/src/css/custom.css
@@ -50,6 +50,7 @@
}

.node-only,
.web-only,
.beta {
  position: relative;
}
@@ -60,7 +61,8 @@
}

.node-only::after,
.beta::after {
.beta::after,
.web-only::after {
  position: absolute;
  right: 0.25rem;
  top: 5px;
@@ -91,6 +93,19 @@
  color: #fff;
}

/* Override `web-only` color */
.web-only::after {
  content: "Web-only";
  color: #0a0072;
  border: 1px solid #0a0072;
}

/* Override `web-only` color in dark mode */
[data-theme="dark"] .web-only::after {
  background: #0a0072;
  color: #fff;
}

.node-only-category,
.beta-category {
  position: relative;
33 changes: 33 additions & 0 deletions examples/src/models/chat/integration_webllm.ts
@@ -0,0 +1,33 @@
// Must be run in a web environment, e.g. a web worker

import { ChatWebLLM } from "@langchain/community/chat_models/webllm";
import { HumanMessage } from "@langchain/core/messages";

// Initialize the ChatWebLLM model with a model ID and chat options.
// Note that if the appConfig field is set, the list of model records
// must include the selected model record for the engine.

// You can see the list of models available by default here:
// https://github.com/mlc-ai/web-llm/blob/main/src/config.ts
//
// Or import it via:
// import { prebuiltAppConfig } from "@mlc-ai/web-llm";
const model = new ChatWebLLM({
  model: "Phi2-q4f32_1",
  chatOptions: {
    temperature: 0.5,
  },
});

// Call the model with a message and await the response.
const response = await model.invoke([
  new HumanMessage({ content: "What is 1 + 1?" }),
]);

console.log(response);

/*
AIMessage {
  content: ' 2\n',
}
*/
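
Because ChatWebLLM implements LangChain's standard chat model interface, it also composes with prompts and output parsers. A minimal sketch (not part of this commit; the prompt wording is illustrative):

```typescript
import { ChatPromptTemplate } from "@langchain/core/prompts";
import { StringOutputParser } from "@langchain/core/output_parsers";

// Compose the local browser model into a simple chain.
const prompt = ChatPromptTemplate.fromMessages([
  ["system", "You are a concise assistant."],
  ["human", "{question}"],
]);
const chain = prompt.pipe(model).pipe(new StringOutputParser());

console.log(await chain.invoke({ question: "What is 2 + 2?" }));
```
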
4 changes: 4 additions & 0 deletions libs/langchain-community/.gitignore
@@ -538,6 +538,10 @@ chat_models/togetherai.cjs
chat_models/togetherai.js
chat_models/togetherai.d.ts
chat_models/togetherai.d.cts
chat_models/webllm.cjs
chat_models/webllm.js
chat_models/webllm.d.ts
chat_models/webllm.d.cts
chat_models/yandex.cjs
chat_models/yandex.js
chat_models/yandex.d.ts
2 changes: 2 additions & 0 deletions libs/langchain-community/langchain.config.js
@@ -170,6 +170,7 @@ export const config = {
    "chat_models/portkey": "chat_models/portkey",
    "chat_models/premai": "chat_models/premai",
    "chat_models/togetherai": "chat_models/togetherai",
    "chat_models/webllm": "chat_models/webllm",
    "chat_models/yandex": "chat_models/yandex",
    "chat_models/zhipuai": "chat_models/zhipuai",
    // callbacks
@@ -388,6 +389,7 @@ export const config = {
    "chat_models/premai",
    "chat_models/iflytek_xinghuo",
    "chat_models/iflytek_xinghuo/web",
    "chat_models/webllm",
    "chat_models/zhipuai",
    "retrievers/amazon_kendra",
    "retrievers/amazon_knowledge_base",
18 changes: 18 additions & 0 deletions libs/langchain-community/package.json
@@ -82,6 +82,7 @@
    "@jest/globals": "^29.5.0",
    "@langchain/scripts": "~0.0",
    "@mendable/firecrawl-js": "^0.0.13",
    "@mlc-ai/web-llm": "^0.2.35",
    "@mozilla/readability": "^0.4.4",
    "@neondatabase/serverless": "^0.9.1",
    "@notionhq/client": "^2.2.10",
@@ -233,6 +234,7 @@
    "@gradientai/nodejs-sdk": "^1.2.0",
    "@huggingface/inference": "^2.6.4",
    "@mendable/firecrawl-js": "^0.0.13",
    "@mlc-ai/web-llm": "^0.2.35",
    "@mozilla/readability": "*",
    "@neondatabase/serverless": "*",
    "@notionhq/client": "^2.2.10",
@@ -398,6 +400,9 @@
    "@mendable/firecrawl-js": {
      "optional": true
    },
    "@mlc-ai/web-llm": {
      "optional": true
    },
    "@mozilla/readability": {
      "optional": true
    },
@@ -1882,6 +1887,15 @@
      "import": "./chat_models/togetherai.js",
      "require": "./chat_models/togetherai.cjs"
    },
    "./chat_models/webllm": {
      "types": {
        "import": "./chat_models/webllm.d.ts",
        "require": "./chat_models/webllm.d.cts",
        "default": "./chat_models/webllm.d.ts"
      },
      "import": "./chat_models/webllm.js",
      "require": "./chat_models/webllm.cjs"
    },
    "./chat_models/yandex": {
      "types": {
        "import": "./chat_models/yandex.d.ts",
@@ -3362,6 +3376,10 @@
    "chat_models/togetherai.js",
    "chat_models/togetherai.d.ts",
    "chat_models/togetherai.d.cts",
    "chat_models/webllm.cjs",
    "chat_models/webllm.js",
    "chat_models/webllm.d.ts",
    "chat_models/webllm.d.cts",
    "chat_models/yandex.cjs",
    "chat_models/yandex.js",
    "chat_models/yandex.d.ts",
69 changes: 69 additions & 0 deletions libs/langchain-community/src/chat_models/tests/webllm.int.test.ts
@@ -0,0 +1,69 @@
// TODO: Fix for Node environments

// import { ChatWebLLM, WebLLMInputs } from "../webllm.js";
// import * as webllm from "@mlc-ai/web-llm";

// jest.mock("@mlc-ai/web-llm", () => ({
//   Engine: jest.fn().mockImplementation(() => ({
//     reload: jest.fn().mockResolvedValue(undefined),
//     setInitProgressCallback: jest.fn(),
//     chat: {
//       completions: {
//         create: jest.fn().mockImplementation(() => {
//           const messages = [
//             {
//               choices: [
//                 {
//                   delta: { content: "Hello" },
//                   logprobs: null,
//                   finish_reason: "complete",
//                 },
//               ],
//             },
//             {
//               choices: [
//                 {
//                   delta: { content: "How are you?" },
//                   logprobs: null,
//                   finish_reason: "complete",
//                 },
//               ],
//             },
//           ];
//           return (async function* () {
//             for (let msg of messages) {
//               yield msg;
//             }
//           })();
//         }),
//       },
//     },
//   })),
// }));

describe("ChatWebLLM Integration Tests", () => {
  // let chatWebLLM: ChatWebLLM;
  // let modelRecord = { model_id: "test-model" };

  // beforeEach(() => {
  //   const inputs: WebLLMInputs = {
  //     modelRecord: modelRecord,
  //     appConfig: {},
  //     chatOpts: {},
  //   };
  //   chatWebLLM = new ChatWebLLM(inputs);
  // });

  test("ChatWebLLM initializes and processes messages correctly", async () => {
    // const options = {}; // Adjust options as necessary
    // const response = await chatWebLLM.invoke("Hello", options);
    // expect(response).toBe("Hello");
    // expect(webllm.Engine).toHaveBeenCalled();
    // expect(webllm.Engine().chat.completions.create).toHaveBeenCalledWith({
    //   stream: true,
    //   messages: [{ role: "user", content: "Hello" }],
    //   stop: null,
    //   logprobs: true,
    // });
  });
});
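
For reference, the mock above emulates WebLLM's OpenAI-style streaming API. A minimal consumption sketch, assuming the `Engine` surface exactly as mocked above (the model ID is illustrative):

```typescript
import { Engine } from "@mlc-ai/web-llm";

// Must run in a web environment with WebGPU available.
const engine = new Engine();
await engine.reload("Phi2-q4f32_1");

// chat.completions.create with stream: true yields delta chunks,
// matching the shape the jest mock above produces.
const chunks = await engine.chat.completions.create({
  stream: true,
  messages: [{ role: "user", content: "Hello" }],
});
for await (const chunk of chunks) {
  console.log(chunk.choices[0]?.delta?.content ?? "");
}
```
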