From 0817f468ef79d506574007daa74ebaa7faa61c9e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Mike=20F=C3=A4hrmann?= Date: Mon, 23 Aug 2021 22:49:35 +0200 Subject: [PATCH] [twitter] expand t.co links in user descriptions (#1532, #1787) --- gallery_dl/extractor/twitter.py | 13 ++++++++++++- 1 file changed, 12 insertions(+), 1 deletion(-) diff --git a/gallery_dl/extractor/twitter.py b/gallery_dl/extractor/twitter.py index ac511288..94c61158 100644 --- a/gallery_dl/extractor/twitter.py +++ b/gallery_dl/extractor/twitter.py @@ -220,7 +220,6 @@ class TwitterExtractor(Extractor): "id" : text.parse_int(uid), "name" : user["screen_name"], "nick" : user["name"], - "description" : user["description"], "location" : user["location"], "date" : text.parse_datetime( user["created_at"], "%a %b %d %H:%M:%S %z %Y"), @@ -236,6 +235,13 @@ class TwitterExtractor(Extractor): "statuses_count" : user["statuses_count"], } + descr = user["description"] + urls = entities["description"].get("urls") + if urls: + for url in urls: + descr = descr.replace(url["url"], url["expanded_url"]) + udata["description"] = descr + if "url" in entities: udata["url"] = entities["url"]["urls"][0]["expanded_url"] @@ -469,6 +475,11 @@ class TwitterTweetExtractor(TwitterExtractor): ("https://twitter.com/i/web/status/1424882930803908612", { "options": (("replies", "self"),), "count": 4, + "keyword": {"user": { + "description": "re:business email-- rhettaro.bloom@gmail.com " + "patreon- http://patreon.com/Princecanary", + "url": "http://princecanary.tumblr.com", + }}, }), ("https://twitter.com/i/web/status/1424898916156284928", { "options": (("replies", "self"),),