From 62c754fe23f3382036a38f72c4bd947d9501a5f1 Mon Sep 17 00:00:00 2001 From: MDLeom <2809763-curben@users.noreply.gitlab.com> Date: Wed, 19 Mar 2025 10:22:34 +0000 Subject: [PATCH] fix(clean_url): encode ^ this is unrelated to address separator of adblock filter syntax https://adblockplus.org/filter-cheatsheet#blocking1 which does not need to be escaped uBO can handle this pattern just fine ||example.com/so%5Emany?ca^r=e^t^$all query string does not need to percent-encode ^, only pathname --- src/clean_url.js | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/src/clean_url.js b/src/clean_url.js index b9613710..9581aeb9 100644 --- a/src/clean_url.js +++ b/src/clean_url.js @@ -30,7 +30,11 @@ for await (const line of createInterface({ input: process.stdin, terminal: false url = new URL(url.searchParams.get('url')) } - const outUrl = `${url.host.replace(/^www\./, '')}${url.pathname}${url.search}` + url.host = url.host.replace(/^www\./, '') + // nodejs does not percent-encode ^ yet + // https://github.com/nodejs/node/issues/57313 + url.pathname = url.pathname.replaceAll('^', encodeURI('^')) + const outUrl = `${url.host}${url.pathname}${url.search}` // remove trailing slash from domain except path #43 .replace(/(^[^/]*)\/+$/, '$1')