e2e tests for engine (#322)
This commit is contained in:

testing/fake-llm-server/chatCompletionHandler.ts — new file, 156 lines

@@ -0,0 +1,156 @@
|
||||
import { Request, Response } from "express";
|
||||
import fs from "fs";
|
||||
import path from "path";
|
||||
import { CANNED_MESSAGE, createStreamChunk } from ".";
|
||||
|
||||
let globalCounter = 0;
|
||||
|
||||
export const createChatCompletionHandler =
|
||||
(prefix: string) => (req: Request, res: Response) => {
|
||||
const { stream = false, messages = [] } = req.body;
|
||||
console.log("* Received messages", messages);
|
||||
|
||||
// Check if the last message contains "[429]" to simulate rate limiting
|
||||
const lastMessage = messages[messages.length - 1];
|
||||
if (lastMessage && lastMessage.content === "[429]") {
|
||||
return res.status(429).json({
|
||||
error: {
|
||||
message: "Too many requests. Please try again later.",
|
||||
type: "rate_limit_error",
|
||||
param: null,
|
||||
code: "rate_limit_exceeded",
|
||||
},
|
||||
});
|
||||
}
|
||||
|
||||
let messageContent = CANNED_MESSAGE;
|
||||
console.error("LASTMESSAGE", lastMessage);
|
||||
// Check if the last message is "[dump]" to write messages to file and return path
|
||||
if (
|
||||
lastMessage &&
|
||||
(Array.isArray(lastMessage.content)
|
||||
? lastMessage.content.some(
|
||||
(part: { type: string; text: string }) =>
|
||||
part.type === "text" && part.text.includes("[dump]"),
|
||||
)
|
||||
: lastMessage.content.includes("[dump]"))
|
||||
) {
|
||||
const timestamp = Date.now();
|
||||
const generatedDir = path.join(__dirname, "generated");
|
||||
|
||||
// Create generated directory if it doesn't exist
|
||||
if (!fs.existsSync(generatedDir)) {
|
||||
fs.mkdirSync(generatedDir, { recursive: true });
|
||||
}
|
||||
|
||||
const dumpFilePath = path.join(generatedDir, `${timestamp}.json`);
|
||||
|
||||
try {
|
||||
fs.writeFileSync(
|
||||
dumpFilePath,
|
||||
JSON.stringify(
|
||||
{
|
||||
body: req.body,
|
||||
headers: { authorization: req.headers["authorization"] },
|
||||
},
|
||||
null,
|
||||
2,
|
||||
),
|
||||
"utf-8",
|
||||
);
|
||||
console.log(`* Dumped messages to: ${dumpFilePath}`);
|
||||
messageContent = `[[dyad-dump-path=${dumpFilePath}]]`;
|
||||
} catch (error) {
|
||||
console.error(`* Error writing dump file: ${error}`);
|
||||
messageContent = `Error: Could not write dump file: ${error}`;
|
||||
}
|
||||
}
|
||||
|
||||
if (lastMessage && lastMessage.content === "[increment]") {
|
||||
globalCounter++;
|
||||
messageContent = `counter=${globalCounter}`;
|
||||
}
|
||||
|
||||
// Check if the last message starts with "tc=" to load test case file
|
||||
if (
|
||||
lastMessage &&
|
||||
lastMessage.content &&
|
||||
typeof lastMessage.content === "string" &&
|
||||
lastMessage.content.startsWith("tc=")
|
||||
) {
|
||||
const testCaseName = lastMessage.content.slice(3); // Remove "tc=" prefix
|
||||
const testFilePath = path.join(
|
||||
__dirname,
|
||||
"..",
|
||||
"..",
|
||||
"..",
|
||||
"e2e-tests",
|
||||
"fixtures",
|
||||
prefix,
|
||||
`${testCaseName}.md`,
|
||||
);
|
||||
|
||||
try {
|
||||
if (fs.existsSync(testFilePath)) {
|
||||
messageContent = fs.readFileSync(testFilePath, "utf-8");
|
||||
console.log(`* Loaded test case: ${testCaseName}`);
|
||||
} else {
|
||||
console.log(`* Test case file not found: ${testFilePath}`);
|
||||
messageContent = `Error: Test case file not found: ${testCaseName}.md`;
|
||||
}
|
||||
} catch (error) {
|
||||
console.error(`* Error reading test case file: ${error}`);
|
||||
messageContent = `Error: Could not read test case file: ${testCaseName}.md`;
|
||||
}
|
||||
}
|
||||
|
||||
// Non-streaming response
|
||||
if (!stream) {
|
||||
return res.json({
|
||||
id: `chatcmpl-${Date.now()}`,
|
||||
object: "chat.completion",
|
||||
created: Math.floor(Date.now() / 1000),
|
||||
model: "fake-model",
|
||||
choices: [
|
||||
{
|
||||
index: 0,
|
||||
message: {
|
||||
role: "assistant",
|
||||
content: messageContent,
|
||||
},
|
||||
finish_reason: "stop",
|
||||
},
|
||||
],
|
||||
});
|
||||
}
|
||||
|
||||
// Streaming response
|
||||
res.setHeader("Content-Type", "text/event-stream");
|
||||
res.setHeader("Cache-Control", "no-cache");
|
||||
res.setHeader("Connection", "keep-alive");
|
||||
|
||||
// Split the message into characters to simulate streaming
|
||||
const message = messageContent;
|
||||
const messageChars = message.split("");
|
||||
|
||||
// Stream each character with a delay
|
||||
let index = 0;
|
||||
const batchSize = 8;
|
||||
|
||||
// Send role first
|
||||
res.write(createStreamChunk("", "assistant"));
|
||||
|
||||
const interval = setInterval(() => {
|
||||
if (index < messageChars.length) {
|
||||
// Get the next batch of characters (up to batchSize)
|
||||
const batch = messageChars.slice(index, index + batchSize).join("");
|
||||
res.write(createStreamChunk(batch));
|
||||
index += batchSize;
|
||||
} else {
|
||||
// Send the final chunk
|
||||
res.write(createStreamChunk("", "assistant", true));
|
||||
clearInterval(interval);
|
||||
res.end();
|
||||
}
|
||||
}, 10);
|
||||
};
|
||||
@@ -1,8 +1,7 @@
|
||||
import express, { Request, Response } from "express";
|
||||
import express from "express";
|
||||
import { createServer } from "http";
|
||||
import cors from "cors";
|
||||
import fs from "fs";
|
||||
import path from "path";
|
||||
import { createChatCompletionHandler } from "./chatCompletionHandler";
|
||||
|
||||
// Create Express app
|
||||
const app = express();
|
||||
@@ -13,7 +12,7 @@ app.use(express.urlencoded({ extended: true, limit: "50mb" }));
|
||||
const PORT = 3500;
|
||||
|
||||
// Helper function to create OpenAI-like streaming response chunks
|
||||
function createStreamChunk(
|
||||
export function createStreamChunk(
|
||||
content: string,
|
||||
role: string = "assistant",
|
||||
isLast: boolean = false,
|
||||
@@ -35,7 +34,7 @@ function createStreamChunk(
|
||||
return `data: ${JSON.stringify(chunk)}\n\n${isLast ? "data: [DONE]\n\n" : ""}`;
|
||||
}
|
||||
|
||||
const CANNED_MESSAGE = `
|
||||
export const CANNED_MESSAGE = `
|
||||
<think>
|
||||
\`<dyad-write>\`:
|
||||
I'll think about the problem and write a bug report.
|
||||
@@ -93,8 +92,6 @@ app.get("/ollama/api/tags", (req, res) => {
|
||||
res.json(ollamaModels);
|
||||
});
|
||||
|
||||
let globalCounter = 0;
|
||||
|
||||
app.post("/ollama/chat", (req, res) => {
|
||||
// Tell the client we're going to stream NDJSON
|
||||
res.setHeader("Content-Type", "application/x-ndjson");
|
||||
@@ -183,151 +180,16 @@ app.get("/lmstudio/api/v0/models", (req, res) => {
|
||||
res.json(lmStudioModels);
|
||||
});
|
||||
|
||||
app.post("/lmstudio/v1/chat/completions", chatCompletionHandler);
|
||||
app.post(
|
||||
"/lmstudio/v1/chat/completions",
|
||||
createChatCompletionHandler("lmstudio"),
|
||||
);
|
||||
|
||||
app.post("/engine/v1/chat/completions", createChatCompletionHandler("engine"));
|
||||
|
||||
// Handle POST requests to /v1/chat/completions
|
||||
app.post("/v1/chat/completions", chatCompletionHandler);
|
||||
app.post("/v1/chat/completions", createChatCompletionHandler("."));
|
||||
|
||||
function chatCompletionHandler(req: Request, res: Response) {
|
||||
const { stream = false, messages = [] } = req.body;
|
||||
console.log("* Received messages", messages);
|
||||
|
||||
// Check if the last message contains "[429]" to simulate rate limiting
|
||||
const lastMessage = messages[messages.length - 1];
|
||||
if (lastMessage && lastMessage.content === "[429]") {
|
||||
return res.status(429).json({
|
||||
error: {
|
||||
message: "Too many requests. Please try again later.",
|
||||
type: "rate_limit_error",
|
||||
param: null,
|
||||
code: "rate_limit_exceeded",
|
||||
},
|
||||
});
|
||||
}
|
||||
|
||||
let messageContent = CANNED_MESSAGE;
|
||||
console.error("LASTMESSAGE", lastMessage);
|
||||
// Check if the last message is "[dump]" to write messages to file and return path
|
||||
if (
|
||||
lastMessage &&
|
||||
(Array.isArray(lastMessage.content)
|
||||
? lastMessage.content.some(
|
||||
(part: { type: string; text: string }) =>
|
||||
part.type === "text" && part.text.includes("[dump]"),
|
||||
)
|
||||
: lastMessage.content.includes("[dump]"))
|
||||
) {
|
||||
const timestamp = Date.now();
|
||||
const generatedDir = path.join(__dirname, "generated");
|
||||
|
||||
// Create generated directory if it doesn't exist
|
||||
if (!fs.existsSync(generatedDir)) {
|
||||
fs.mkdirSync(generatedDir, { recursive: true });
|
||||
}
|
||||
|
||||
const dumpFilePath = path.join(generatedDir, `${timestamp}.json`);
|
||||
|
||||
try {
|
||||
fs.writeFileSync(
|
||||
dumpFilePath,
|
||||
JSON.stringify(messages, null, 2),
|
||||
"utf-8",
|
||||
);
|
||||
console.log(`* Dumped messages to: ${dumpFilePath}`);
|
||||
messageContent = `[[dyad-dump-path=${dumpFilePath}]]`;
|
||||
} catch (error) {
|
||||
console.error(`* Error writing dump file: ${error}`);
|
||||
messageContent = `Error: Could not write dump file: ${error}`;
|
||||
}
|
||||
}
|
||||
|
||||
if (lastMessage && lastMessage.content === "[increment]") {
|
||||
globalCounter++;
|
||||
messageContent = `counter=${globalCounter}`;
|
||||
}
|
||||
|
||||
// Check if the last message starts with "tc=" to load test case file
|
||||
if (
|
||||
lastMessage &&
|
||||
lastMessage.content &&
|
||||
typeof lastMessage.content === "string" &&
|
||||
lastMessage.content.startsWith("tc=")
|
||||
) {
|
||||
const testCaseName = lastMessage.content.slice(3); // Remove "tc=" prefix
|
||||
const testFilePath = path.join(
|
||||
__dirname,
|
||||
"..",
|
||||
"..",
|
||||
"..",
|
||||
"e2e-tests",
|
||||
"fixtures",
|
||||
`${testCaseName}.md`,
|
||||
);
|
||||
|
||||
try {
|
||||
if (fs.existsSync(testFilePath)) {
|
||||
messageContent = fs.readFileSync(testFilePath, "utf-8");
|
||||
console.log(`* Loaded test case: ${testCaseName}`);
|
||||
} else {
|
||||
console.log(`* Test case file not found: ${testFilePath}`);
|
||||
messageContent = `Error: Test case file not found: ${testCaseName}.md`;
|
||||
}
|
||||
} catch (error) {
|
||||
console.error(`* Error reading test case file: ${error}`);
|
||||
messageContent = `Error: Could not read test case file: ${testCaseName}.md`;
|
||||
}
|
||||
}
|
||||
|
||||
// Non-streaming response
|
||||
if (!stream) {
|
||||
return res.json({
|
||||
id: `chatcmpl-${Date.now()}`,
|
||||
object: "chat.completion",
|
||||
created: Math.floor(Date.now() / 1000),
|
||||
model: "fake-model",
|
||||
choices: [
|
||||
{
|
||||
index: 0,
|
||||
message: {
|
||||
role: "assistant",
|
||||
content: messageContent,
|
||||
},
|
||||
finish_reason: "stop",
|
||||
},
|
||||
],
|
||||
});
|
||||
}
|
||||
|
||||
// Streaming response
|
||||
res.setHeader("Content-Type", "text/event-stream");
|
||||
res.setHeader("Cache-Control", "no-cache");
|
||||
res.setHeader("Connection", "keep-alive");
|
||||
|
||||
// Split the message into characters to simulate streaming
|
||||
const message = messageContent;
|
||||
const messageChars = message.split("");
|
||||
|
||||
// Stream each character with a delay
|
||||
let index = 0;
|
||||
const batchSize = 8;
|
||||
|
||||
// Send role first
|
||||
res.write(createStreamChunk("", "assistant"));
|
||||
|
||||
const interval = setInterval(() => {
|
||||
if (index < messageChars.length) {
|
||||
// Get the next batch of characters (up to batchSize)
|
||||
const batch = messageChars.slice(index, index + batchSize).join("");
|
||||
res.write(createStreamChunk(batch));
|
||||
index += batchSize;
|
||||
} else {
|
||||
// Send the final chunk
|
||||
res.write(createStreamChunk("", "assistant", true));
|
||||
clearInterval(interval);
|
||||
res.end();
|
||||
}
|
||||
}, 10);
|
||||
}
|
||||
// Start the server
|
||||
const server = createServer(app);
|
||||
server.listen(PORT, () => {
|
||||
|
||||
Reference in New Issue
Block a user