[fix] Result type: remove rstrip "/" form url normalization
This commit is contained in:
parent
087da66565
commit
99ad69450d
@ -55,8 +55,7 @@ def _normalize_url_fields(result: Result | LegacyResult):
|
|||||||
result.parsed_url = result.parsed_url._replace(
|
result.parsed_url = result.parsed_url._replace(
|
||||||
# if the result has no scheme, use http as default
|
# if the result has no scheme, use http as default
|
||||||
scheme=result.parsed_url.scheme or "http",
|
scheme=result.parsed_url.scheme or "http",
|
||||||
# normalize ``example.com/path/`` to ``example.com/path``
|
path=result.parsed_url.path,
|
||||||
path=result.parsed_url.path.rstrip("/"),
|
|
||||||
)
|
)
|
||||||
result.url = result.parsed_url.geturl()
|
result.url = result.parsed_url.geturl()
|
||||||
|
|
||||||
@ -73,7 +72,7 @@ def _normalize_url_fields(result: Result | LegacyResult):
|
|||||||
item["url"] = _url._replace(
|
item["url"] = _url._replace(
|
||||||
scheme=_url.scheme or "http",
|
scheme=_url.scheme or "http",
|
||||||
# netloc=_url.netloc.replace("www.", ""),
|
# netloc=_url.netloc.replace("www.", ""),
|
||||||
path=_url.path.rstrip("/"),
|
path=_url.path,
|
||||||
).geturl()
|
).geturl()
|
||||||
|
|
||||||
infobox_id = getattr(result, "id", None)
|
infobox_id = getattr(result, "id", None)
|
||||||
@ -82,7 +81,7 @@ def _normalize_url_fields(result: Result | LegacyResult):
|
|||||||
result.id = _url._replace(
|
result.id = _url._replace(
|
||||||
scheme=_url.scheme or "http",
|
scheme=_url.scheme or "http",
|
||||||
# netloc=_url.netloc.replace("www.", ""),
|
# netloc=_url.netloc.replace("www.", ""),
|
||||||
path=_url.path.rstrip("/"),
|
path=_url.path,
|
||||||
).geturl()
|
).geturl()
|
||||||
|
|
||||||
|
|
||||||
@ -259,9 +258,6 @@ class Result(msgspec.Struct, kw_only=True):
|
|||||||
``parse_url`` from field ``url``. The ``url`` field is initialized
|
``parse_url`` from field ``url``. The ``url`` field is initialized
|
||||||
with the resulting value in ``parse_url``, if ``url`` and
|
with the resulting value in ``parse_url``, if ``url`` and
|
||||||
``parse_url`` are not equal.
|
``parse_url`` are not equal.
|
||||||
|
|
||||||
- ``example.com/path/`` and ``example.com/path`` are equivalent and are
|
|
||||||
normalized to ``example.com/path``.
|
|
||||||
"""
|
"""
|
||||||
_normalize_url_fields(self)
|
_normalize_url_fields(self)
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user