From 939fec8ecdf1247791269dbf05e65203af8002aa Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Mike=20F=C3=A4hrmann?= Date: Sun, 5 Jan 2020 17:32:06 +0100 Subject: [PATCH] [deviantart] match new search/popular URLs (closes #538) --- gallery_dl/extractor/deviantart.py | 27 ++++++++++++++++++++++----- 1 file changed, 22 insertions(+), 5 deletions(-) diff --git a/gallery_dl/extractor/deviantart.py b/gallery_dl/extractor/deviantart.py index 95880d48a07..0437ab4e339 100644 --- a/gallery_dl/extractor/deviantart.py +++ b/gallery_dl/extractor/deviantart.py @@ -576,12 +576,22 @@ class DeviantartPopularExtractor(DeviantartExtractor): directory_fmt = ("{category}", "Popular", "{popular[range]}", "{popular[search]}") archive_fmt = "P_{popular[range]}_{popular[search]}_{index}.{extension}" - pattern = (r"(?:https?://)?www\.deviantart\.com" - r"((?:/\w+)*)/(?:popular-([^/?&#]+))/?(?:\?([^#]*))?") + pattern = (r"(?:https?://)?www\.deviantart\.com/(?:" + r"search(?:/deviations)?" + r"|(?:deviations/?)?\?order=(popular-[^/?&#]+)" + r"|((?:[\w-]+/)*)(popular-[^/?&#]+)" + r")/?(?:\?([^#]*))?") test = ( + ("https://www.deviantart.com/?order=popular-all-time", { + "options": (("original", False),), + "range": "1-30", + "count": 30, + }), ("https://www.deviantart.com/popular-24-hours/?q=tree+house", { "options": (("original", False),), }), + ("https://www.deviantart.com/search?q=tree"), + ("https://www.deviantart.com/search/deviations?order=popular-1-week"), ("https://www.deviantart.com/artisan/popular-all-time/?q=tree"), ) @@ -590,13 +600,20 @@ def __init__(self, match): self.search_term = self.time_range = self.category_path = None self.user = "" - path, trange, query = match.groups() + trange1, path, trange2, query = match.groups() + trange = trange1 or trange2 + query = text.parse_query(query) + + if not trange: + trange = query.get("order") + if path: - self.category_path = path.lstrip("/") + self.category_path = path.strip("/") if trange: + trange = trange[8:] if trange.startswith("popular-") else "" self.time_range = trange.replace("-", "").replace("hours", "hr") if query: - self.search_term = text.parse_query(query).get("q") + self.search_term = query.get("q") self.popular = { "search": self.search_term or "",