feat: improve repo matching and exec output cleanup

MackDing · MackDing · commit 3677ee425fcc · 2026-03-14T02:02:32.000+08:00
diff --git a/README.md b/README.md
@@ -125,6 +125,7 @@ General:
 - `/repo` - list switchable git projects under `WORKSPACE_ROOT`
 - `/repo <name>` - switch the current chat to another project
 - `/repo <keyword>` - fuzzy match projects; switch if only one match, otherwise list candidates
+- `/repo <typo>` - suggest the closest project name when there is no direct match
 - `/repo recent` - show recent projects for the current chat
 - `/repo -` - switch back to the previous project
 - `/new` - clear the saved Codex conversation for the current project and start fresh on the next message
@@ -186,6 +187,7 @@ PTY output is streamed with throttled `editMessageText` updates.
   - spoiler (`||...||`, default)
   - quote block (if `REASONING_RENDER_MODE=quote`)
 - If `node-pty` cannot spawn on the current host, the runner falls back to `codex exec` for per-request execution
+- In `codex exec` fallback mode, Telegram output is cleaned to hide the Codex banner, raw tool traces, `mcp startup` lines, and the duplicate `tokens used` footer
 
 ## Project-Scoped Conversation State
 
diff --git a/src/bot/formatter.js b/src/bot/formatter.js
@@ -1,5 +1,7 @@
 const THINK_BLOCK_REGEX = /<think>([\s\S]*?)<\/think>/gi;
 const TELEGRAM_SPECIAL_REGEX = /[_*[\]()~`>#+\-=|{}.!\\]/g;
+const CODEX_DIVIDER = "\n--------\n";
+const CODEX_TRANSCRIPT_HEADER_REGEX = /^OpenAI Codex v[^\n]*\n/;
 
 export function escapeMarkdownV2(input = "") {
   return String(input).replace(TELEGRAM_SPECIAL_REGEX, "\\$&");
@@ -21,6 +23,101 @@ export function extractReasoning(raw = "") {
   };
 }
 
+function removeCodexBanner(raw = "") {
+  const source = String(raw || "").replace(/\r/g, "");
+  if (!CODEX_TRANSCRIPT_HEADER_REGEX.test(source)) return source;
+
+  const firstDividerIndex = source.indexOf(CODEX_DIVIDER);
+  if (firstDividerIndex === -1) return source;
+
+  const secondDividerIndex = source.indexOf(
+    CODEX_DIVIDER,
+    firstDividerIndex + CODEX_DIVIDER.length
+  );
+  if (secondDividerIndex === -1) return source;
+
+  return source.slice(secondDividerIndex + CODEX_DIVIDER.length);
+}
+
+export function extractCodexExecResponse(raw = "") {
+  const source = removeCodexBanner(raw);
+  if (!source) return "";
+
+  const blocks = [];
+  let section = null;
+  let currentCodexLines = [];
+  let skipNextNonEmptyLine = false;
+
+  const flushCodexBlock = () => {
+    if (!currentCodexLines.length) return;
+
+    const content = currentCodexLines.join("\n").trim();
+    if (content) blocks.push(content);
+    currentCodexLines = [];
+  };
+
+  for (const line of source.split("\n")) {
+    const trimmed = line.trim();
+
+    if (skipNextNonEmptyLine) {
+      if (trimmed) {
+        skipNextNonEmptyLine = false;
+      }
+      continue;
+    }
+
+    if (trimmed === "tokens used") {
+      flushCodexBlock();
+      break;
+    }
+
+    if (/^mcp startup:/i.test(trimmed)) {
+      continue;
+    }
+
+    if (trimmed === "user") {
+      flushCodexBlock();
+      section = "user";
+      continue;
+    }
+
+    if (trimmed === "codex") {
+      flushCodexBlock();
+      section = "codex";
+      continue;
+    }
+
+    if (trimmed === "exec") {
+      flushCodexBlock();
+      section = "exec";
+      continue;
+    }
+
+    if (trimmed === "tokens" || trimmed === "token usage") {
+      flushCodexBlock();
+      break;
+    }
+
+    if (/^[\d,]+$/.test(trimmed) && section !== "codex") {
+      continue;
+    }
+
+    if (section === "codex") {
+      currentCodexLines.push(line);
+      continue;
+    }
+
+    if (/^tokens used\b/i.test(trimmed)) {
+      flushCodexBlock();
+      skipNextNonEmptyLine = true;
+      continue;
+    }
+  }
+
+  flushCodexBlock();
+  return blocks.at(-1) || "";
+}
+
 function renderReasoningBlock(content, mode = "spoiler") {
   const escaped = escapeMarkdownV2(content);
   if (mode === "quote") {
@@ -42,8 +139,10 @@ function renderReasoningBlock(content, mode = "spoiler") {
 }
 
 export function formatPtyOutput(raw, options = {}) {
-  const { mode = "spoiler" } = options;
-  const { cleanText, reasoningBlocks } = extractReasoning(raw);
+  const { mode = "spoiler", sessionMode = "pty" } = options;
+  const normalizedRaw =
+    sessionMode === "exec" ? extractCodexExecResponse(raw) : String(raw || "");
+  const { cleanText, reasoningBlocks } = extractReasoning(normalizedRaw);
   const sections = [];
 
   if (cleanText) {
diff --git a/src/bot/handlers.js b/src/bot/handlers.js
@@ -1,5 +1,9 @@
 import { Markup } from "telegraf";
-import { buildPlanPrompt, extractCommandPayload } from "./commandUtils.js";
+import {
+  buildPlanPrompt,
+  extractCommandPayload,
+  suggestClosestWord
+} from "./commandUtils.js";
 import { escapeMarkdownV2, splitTelegramMessage } from "./formatter.js";
 
 async function sendChunkedMarkdown(ctx, text, extra = {}) {
@@ -48,6 +52,21 @@ function formatSkillLines(skillStates) {
   return skillStates.map((skill) => `- ${skill.name}: ${skill.enabled ? "on" : "off"}`);
 }
 
+function suggestProjectName(input, projects) {
+  const candidates = [
+    ...new Set(
+      projects.flatMap((project) => [project.relativePath, project.name]).filter(Boolean)
+    )
+  ];
+
+  const threshold = Math.min(
+    6,
+    Math.max(2, Math.ceil(String(input || "").trim().length * 0.35))
+  );
+
+  return suggestClosestWord(input, candidates, threshold);
+}
+
 export function registerHandlers({
   bot,
   router,
@@ -209,6 +228,13 @@ export function registerHandlers({
           );
 
           if (!matches.length) {
+            const suggestion = suggestProjectName(payload, projects);
+            if (suggestion) {
+              throw new Error(
+                `没有匹配的项目: ${payload}\n你是不是想找: ${suggestion}\ntry: /repo ${suggestion}`
+              );
+            }
+
             throw new Error(`没有匹配的项目: ${payload}`);
           }
 
diff --git a/src/runner/ptyManager.js b/src/runner/ptyManager.js
@@ -410,7 +410,10 @@ export class PtyManager {
     if (!session) return;
 
     const rawTail = session.rawBuffer.slice(-60000);
-    const rendered = formatPtyOutput(rawTail, { mode: this.config.reasoning.mode });
+    const rendered = formatPtyOutput(rawTail, {
+      mode: this.config.reasoning.mode,
+      sessionMode: session.mode
+    });
     if (rendered === session.lastRendered) return;
     session.lastRendered = rendered;
 
diff --git a/tests/commandUtils.test.js b/tests/commandUtils.test.js
@@ -24,3 +24,10 @@ test("suggestClosestWord returns the nearest supported command when the typo is
   assert.equal(suggestClosestWord("ststus", ["list", "status", "tools"]), "status");
   assert.equal(suggestClosestWord("zzz", ["list", "status", "tools"]), "");
 });
+
+test("suggestClosestWord supports larger edit distances when the caller relaxes the threshold", () => {
+  assert.equal(
+    suggestClosestWord("ai-engineer-hub", ["ai-engineering-hub"], 6),
+    "ai-engineering-hub"
+  );
+});
diff --git a/tests/formatter.test.js b/tests/formatter.test.js
@@ -2,6 +2,7 @@ import test from "node:test";
 import assert from "node:assert/strict";
 import {
   escapeMarkdownV2,
+  extractCodexExecResponse,
   extractReasoning,
   formatPtyOutput,
   splitTelegramMessage
@@ -34,6 +35,60 @@ test("formatPtyOutput renders visible output and spoiler reasoning", () => {
   assert.match(rendered, /\|\|private reasoning\|\|/);
 });
 
+test("extractCodexExecResponse strips codex exec transcript noise and keeps the final assistant reply", () => {
+  const raw = [
+    "OpenAI Codex v0.114.0 (research preview)",
+    "--------",
+    "workdir: /tmp/demo",
+    "model: gpt-5.4",
+    "session id: 11111111-1111-1111-1111-111111111111",
+    "--------",
+    "user",
+    "run unit test",
+    "mcp startup: no servers",
+    "codex",
+    "I’m checking the repository layout first.",
+    "exec",
+    "/bin/zsh -lc 'npm test' succeeded in 1.07s:",
+    "ok",
+    "codex",
+    "`npm test` passed.",
+    "",
+    "15 tests ran, 15 passed, 0 failed.",
+    "tokens used",
+    "8,301",
+    "`npm test` passed.",
+    "",
+    "15 tests ran, 15 passed, 0 failed."
+  ].join("\n");
+
+  assert.equal(
+    extractCodexExecResponse(raw),
+    "`npm test` passed.\n\n15 tests ran, 15 passed, 0 failed."
+  );
+});
+
+test("formatPtyOutput uses cleaned codex exec content when session mode is exec", () => {
+  const raw = [
+    "OpenAI Codex v0.114.0 (research preview)",
+    "--------",
+    "workdir: /tmp/demo",
+    "--------",
+    "user",
+    "who are u",
+    "mcp startup: no servers",
+    "codex",
+    "I am Codex."
+  ].join("\n");
+
+  const rendered = formatPtyOutput(raw, {
+    mode: "spoiler",
+    sessionMode: "exec"
+  });
+
+  assert.equal(rendered, "I am Codex\\.");
+});
+
 test("splitTelegramMessage preserves content and avoids trailing escape characters in chunks", () => {
   const input = `${"a".repeat(9)}\\b`;
   const chunks = splitTelegramMessage(input, 10);