@classmethod
def _fixup_mrkdwn(cls, text: str) -> str:
    """Fix Markdown artifacts that ``slackify_markdown`` leaves behind.

    Two fixups are applied, in order, to everything outside of code:

    1. Leftover ``**bold**`` runs matched by ``_LEFTOVER_BOLD_RE``
       (e.g. ``**key:**val``) are rewritten to the single-asterisk
       ``*bold*`` form.
    2. Inside every match of ``_BARE_URL_RE``, the ``&amp;`` entity is
       turned back into a plain ``&``.

    Fenced code blocks (``_CODE_FENCE_RE``) and single-line inline code
    spans are swapped for placeholders before the fixups run and are
    restored afterwards, so their contents come back untouched.

    Args:
        text: The mrkdwn text to post-process.

    Returns:
        ``text`` with both fixups applied outside of code.
    """
    # Code saved here is put back verbatim once the fixups are done.
    protected: list[str] = []

    def _save_code(m: re.Match) -> str:
        # NUL-delimited token: contains no '*', '&' or '`', so neither
        # the fixups nor the inline-code pass below can match it.
        protected.append(m.group(0))
        return f"\x00CB{len(protected) - 1}\x00"

    # Fenced blocks first, then inline spans. Without the second pass a
    # span such as `a ** b ** c` would be rewritten by the bold fixup.
    text = cls._CODE_FENCE_RE.sub(_save_code, text)
    text = re.sub(r"`[^`\n]+`", _save_code, text)

    # Leftover **bold** the library did not convert (e.g. **key:**val).
    text = cls._LEFTOVER_BOLD_RE.sub(r"*\1*", text)

    # Undo the library's over-escaping of '&' inside bare URLs. The
    # search string must be the entity; replacing "&" with "&" is a
    # no-op.
    text = cls._BARE_URL_RE.sub(
        lambda m: m.group(0).replace("&amp;", "&"), text
    )

    # Restore newest-first: an inline span saved later may itself hold
    # the placeholder of an earlier fenced block.
    for index in reversed(range(len(protected))):
        text = text.replace(f"\x00CB{index}\x00", protected[index])

    return text