From 67882d49a9c1ae2cb60194ab8c6aae23b4cc5957 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Mon, 3 Nov 2025 05:59:46 +0000
Subject: [PATCH] Fix NON_BREAKING_SPACE_PATTERN to avoid matching regular spaces

Co-authored-by: TheLovinator1 <4153203+TheLovinator1@users.noreply.github.com>
---
 scrape.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/scrape.py b/scrape.py
index 08c20ba..aae4172 100644
--- a/scrape.py
+++ b/scrape.py
@@ -33,7 +33,7 @@ SQUARE_BRACKETS_PATTERN = re.compile(r"^\s*\[([^\]]+)\]\s*$", re.MULTILINE)
 BALL_PATTERN = re.compile(r"●\s*(.*?)\n", re.MULTILINE)
 REFERENCE_MARK_PATTERN = re.compile(r"^\s*※\s*(\S.*?)\s*$", re.MULTILINE)
 ESCAPED_STAR_PATTERN = re.compile(r"\\\*(.*)", re.MULTILINE)
-NON_BREAKING_SPACE_PATTERN = re.compile(r"[\xa0 ]") # noqa: RUF001
+NON_BREAKING_SPACE_PATTERN = re.compile(r"[\xa0\u00a0\u2002\u2003\u2009]") # Various nbsp characters
 EMPTY_CODE_BLOCK_PATTERN = re.compile(r"```[ \t]*\n[ \t]*\n```")
 
 # Circled number patterns - precompile for better performance