We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 90af453 commit 40ab287 (Copy full SHA for 40ab287)
crawl4ai/utils.py
@@ -2184,8 +2184,10 @@ def normalize_url(
2184
netloc = parsed.netloc.lower()
2185
2186
# ── path ──
2187
- # Strip duplicate slashes and trailing “/” (except root)
2188
- path = quote(unquote(parsed.path))
+ # Strip duplicate slashes and trailing "/" (except root)
+ # IMPORTANT: Don't use quote(unquote()) as it mangles + signs in URLs
2189
+ # The path from urlparse is already properly encoded
2190
+ path = parsed.path
2191
if path.endswith('/') and path != '/':
2192
path = path.rstrip('/')
2193
0 commit comments