fix(scraper): improve charset detection regex to accurately parse meta tags (#1265)

2025-02-27 00:31:06 +08:00
parent bf1a79588e
commit 7bf04d409a
1 changed file with 1 addition and 1 deletion
@@ -74,7 +74,7 @@ export async function scrapeURLWithFetch(
      const buf = Buffer.from(await x.arrayBuffer());
      let text = buf.toString("utf8");
-      const charset = (text.match(/charset=["']?(.+?)["']?>/) ?? [])[1]
+      const charset = (text.match(/<meta\b[^>]*charset\s*=\s*["']?([^"'\s\/>]+)/i) ?? [])[1]
      try {
        if (charset) {
          text = new TextDecoder(charset.trim()).decode(buf);