* first working chat example "lms ask sup" or "lms chat"

* print streaming response instead of waiting until the end

* visual polish

* removed ask alias, chat only. --prompt or -p to provide an initial prompt (quits after the response). model selection, e.g. "lms chat phi-4"

* use existing Chat class for context management, use existing optionalPositional() for model arg

* Prettier formatting changes, added types, added quit instructions

* allow combining -p with stdin for processing piped content with a prompt (see the usage examples below)
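
Illustrative usage of the resulting command (the piped file name and prompt text below are placeholders; the flags and the model name come from this commit):

    lms chat                                        # interactive chat with the currently loaded model
    lms chat phi-4                                  # chat with a specific model
    lms chat -p "sup"                               # one-shot: print the response and quit
    cat notes.txt | lms chat -p "summarize this"    # combine -p with piped stdin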
Author: Murat Ayfer
Date: 2025-05-09 12:18:59 -07:00 (committed by GitHub)
Commit: bcdfc235ba (parent 91bd55686b)
2 changed files with 171 additions and 0 deletions


@@ -1,5 +1,6 @@
import { run, subcommands } from "cmd-ts";
import { bootstrap } from "./subcommands/bootstrap.js";
import { chat } from "./subcommands/chat.js";
import { clone } from "./subcommands/clone.js";
import { create } from "./subcommands/create.js";
import { dev } from "./subcommands/dev.js";
@@ -25,6 +26,7 @@ if (process.argv.length === 2) {
const cli = subcommands({
  name: "lms",
  cmds: {
    chat,
    status,
    server,
    ls,

src/subcommands/chat.ts (new file, 169 lines)

@@ -0,0 +1,169 @@
import { Chat, type LLM } from "@lmstudio/sdk";
import { command, option, optional, string } from "cmd-ts";
import * as readline from "readline";
import { createClient, createClientArgs } from "../createClient.js";
import { createLogger, logLevelArgs } from "../logLevel.js";
import { optionalPositional } from "../optionalPositional.js";
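
// Collect everything piped on stdin until EOF (used when stdin is not a TTY).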
async function readStdin(): Promise<string> {
  return new Promise(resolve => {
    let input = "";
    process.stdin.setEncoding("utf-8");
    process.stdin.on("data", chunk => {
      input += chunk;
    });
    process.stdin.on("end", () => {
      resolve(input.trim());
    });
  });
}
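
// The `lms chat` subcommand: interactive REPL, or a single response when a prompt or stdin is given.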
export const chat = command({
  name: "chat",
  description: "Open an interactive chat with the currently loaded model.",
  args: {
    ...logLevelArgs,
    ...createClientArgs,
    model: optionalPositional({
      displayName: "model",
      description: "Model name to use",
      type: string,
      default: "",
    }),
    prompt: option({
      type: optional(string),
      long: "prompt",
      short: "p",
      description: "Print response to stdout and quit",
    }),
    systemPrompt: option({
      type: optional(string),
      long: "system-prompt",
      short: "s",
      description: "Custom system prompt to use for the chat",
    }),
  },
  async handler(args) {
    const logger = createLogger(args);
    const client = await createClient(logger, args);
    let initialPrompt = "";
    if (args.prompt) {
      initialPrompt = args.prompt;
      if (!process.stdin.isTTY) {
        const stdinContent = await readStdin();
        initialPrompt = `${initialPrompt}\n\n${stdinContent}`;
      }
    } else if (!process.stdin.isTTY) {
      initialPrompt = await readStdin();
    }
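    // Use the explicitly named model if given, otherwise fall back to the currently loaded default.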
    let model: LLM;
    if (args.model) {
      try {
        model = await client.llm.model(args.model);
      } catch (e) {
        logger.error(`Model "${args.model}" not found, check available models with:`);
        logger.error(" lms ls");
        process.exit(1);
      }
    } else {
      try {
        model = await client.llm.model();
      } catch (e) {
        logger.error("No loaded default model found, load one first:");
        logger.error(" lms load");
        process.exit(1);
      }
    }
    if (!initialPrompt) {
      logger.info(`Chatting with ${model.identifier}. Type 'exit', 'quit' or Ctrl+C to quit`);
    }
    const chat = Chat.empty();
    chat.append(
      "system",
      args.systemPrompt ??
        "You are a technical AI assistant. Answer questions clearly, concisely and to-the-point.",
    );
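    // One-shot mode: stream the response for the initial prompt, then exit.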
    if (initialPrompt) {
      chat.append("user", initialPrompt);
      try {
        const prediction = model.respond(chat);
        let lastFragment = "";
        for await (const fragment of prediction) {
          process.stdout.write(fragment.content);
          lastFragment = fragment.content;
        }
        const result = await prediction.result();
        chat.append("assistant", result.content);
        if (!lastFragment.endsWith("\n")) {
          // Newline before new shell prompt if not already there
          process.stdout.write("\n");
        }
        process.exit(0);
      } catch (err) {
        logger.error("Error during chat:", err);
        process.exit(1);
      }
    }
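    // Interactive mode: read lines from the terminal and stream each response.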
    if (process.stdin.isTTY) {
      const rl = readline.createInterface({
        input: process.stdin,
        output: process.stdout,
        prompt: " ",
      });
      process.stdout.write("\n");
      rl.prompt();
      rl.on("line", async (line: string) => {
        const input = line.trim();
        if (input === "exit" || input === "quit") {
          rl.close();
          return;
        }
        // Skip empty input
        if (!input) {
          rl.prompt();
          return;
        }
        try {
          chat.append("user", input);
          process.stdout.write("\n● ");
          const prediction = model.respond(chat);
          // Temporarily pause the readline interface
          rl.pause();
          for await (const fragment of prediction) {
            process.stdout.write(fragment.content);
          }
          const result = await prediction.result();
          chat.append("assistant", result.content);
          // Resume readline and write a new prompt
          process.stdout.write("\n\n");
          rl.resume();
          rl.prompt();
        } catch (err) {
          logger.error("Error during chat:", err);
          rl.prompt();
        }
      });
      rl.on("close", () => {
        process.exit(0);
      });
    } else {
      process.exit(0);
    }
  },
});