From 6083ea26642f7494a5d80c531a8ab369e7dba596 Mon Sep 17 00:00:00 2001 From: Soxoj <31013580+soxoj@users.noreply.github.com> Date: Tue, 7 Apr 2026 18:25:13 +0200 Subject: [PATCH] Fix Spotify, add Spotify Community forum (#2467) --- maigret/activation.py | 11 --------- maigret/resources/data.json | 41 +++++++++++++++++----------------- maigret/resources/db_meta.json | 6 ++--- sites.md | 23 ++++++++++--------- 4 files changed, 35 insertions(+), 46 deletions(-) diff --git a/maigret/activation.py b/maigret/activation.py index faa1acb..c02a631 100644 --- a/maigret/activation.py +++ b/maigret/activation.py @@ -30,17 +30,6 @@ class ParsingActivator: jwt_token = r.json()["jwt"] site.headers["Authorization"] = "jwt " + jwt_token - @staticmethod - def spotify(site, logger, cookies={}): - headers = dict(site.headers) - if "Authorization" in headers: - del headers["Authorization"] - import requests - - r = requests.get(site.activation["url"]) - bearer_token = r.json()["accessToken"] - site.headers["authorization"] = f"Bearer {bearer_token}" - @staticmethod def weibo(site, logger): headers = dict(site.headers) diff --git a/maigret/resources/data.json b/maigret/resources/data.json index a4dad42..173df8b 100644 --- a/maigret/resources/data.json +++ b/maigret/resources/data.json @@ -535,33 +535,16 @@ ] }, "Spotify": { - "disabled": true, "tags": [ "music" ], - "headers": { - "authorization": "Bearer BQDDk6n__YLKqIDKxBb2fvOZm6yxuOj0XeU0mCpRmBi_0UsUz2fUP-tFsl7IjT-YOCXxmvfzUMAnQ0Y4KBo" - }, - "errors": { - "Spotify is currently not available in your country.": "Access denied in your country, use proxy/vpn" - }, - "activation": { - "method": "spotify", - "marks": [ - "No token provided", - "The access token expired" - ], - "url": "https://open.spotify.com/get_access_token?reason=transport&productType=web_player", - "src": "accessToken", - "dst": "authorization" - }, - "urlProbe": "https://spclient.wg.spotify.com/user-profile-view/v3/profile/{username}?playlist_limit=10&artist_limit=10&market=EN", "checkType": "status_code", - "alexaRank": 63, "urlMain": "https://open.spotify.com/", "url": "https://open.spotify.com/user/{username}", - "usernameClaimed": "blue", - "usernameUnclaimed": "noonewouldeverusethis7" + "urlProbe": "https://api.stats.fm/api/v1/users/{username}", + "usernameClaimed": "alex", + "usernameUnclaimed": "noonewouldeverusethis7", + "alexaRank": 63 }, "Archive.org": { "checkType": "message", @@ -35137,6 +35120,22 @@ "crypto", "gaming" ] + }, + "SpotifyCommunity": { + "url": "https://community.spotify.com/t5/forums/searchpage/tab/user?q={username}", + "urlMain": "https://community.spotify.com", + "checkType": "message", + "absenceStrs": [ + "0 results", + "No search results found" + ], + "regexCheck": "^[a-zA-Z0-9_.]+$", + "usernameClaimed": "adam", + "usernameUnclaimed": "noonewouldeverusethis7", + "tags": [ + "forum", + "music" + ] } }, "engines": { diff --git a/maigret/resources/db_meta.json b/maigret/resources/db_meta.json index 5009c3d..3d772c6 100644 --- a/maigret/resources/db_meta.json +++ b/maigret/resources/db_meta.json @@ -1,8 +1,8 @@ { "version": 1, - "updated_at": "2026-04-06T19:19:38Z", - "sites_count": 3154, + "updated_at": "2026-04-07T16:18:18Z", + "sites_count": 3155, "min_maigret_version": "0.5.0", - "data_sha256": "e44eee4a22651061460abae4535b935b2021a19377ead76b87a5f24de625df3a", + "data_sha256": "279fb90280814cd11dcd711b1b8e6c6a99fefea4ce6ef05c9d64dced6ac795c0", "data_url": "https://raw.githubusercontent.com/soxoj/maigret/main/maigret/resources/data.json" } \ No newline at end of file diff --git a/sites.md b/sites.md index 0148e4d..a045b77 100644 --- a/sites.md +++ b/sites.md @@ -1,5 +1,5 @@ -## List of supported sites (search methods): total 3154 +## List of supported sites (search methods): total 3155 Rank data fetched from Majestic Million by domains. @@ -24,7 +24,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=https://t.me/) [Telegram (https://t.me/)](https://t.me/)*: top 50, messaging* 1. ![](https://www.google.com/s2/favicons?domain=https://www.reddit.com/) [Reddit (https://www.reddit.com/)](https://www.reddit.com/)*: top 50, discussion, news, social* 1. ![](https://www.google.com/s2/favicons?domain=https://www.tumblr.com) [Tumblr (https://www.tumblr.com)](https://www.tumblr.com)*: top 100, blog, social* -1. ![](https://www.google.com/s2/favicons?domain=https://open.spotify.com/) [Spotify (https://open.spotify.com/)](https://open.spotify.com/)*: top 100, music*, search is disabled +1. ![](https://www.google.com/s2/favicons?domain=https://open.spotify.com/) [Spotify (https://open.spotify.com/)](https://open.spotify.com/)*: top 100, music* 1. ![](https://www.google.com/s2/favicons?domain=https://archive.org) [Archive.org (https://archive.org)](https://archive.org)*: top 100, archive*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://www.flickr.com/) [Flickr (https://www.flickr.com/)](https://www.flickr.com/)*: top 100, photo* 1. ![](https://www.google.com/s2/favicons?domain=https://www.flickr.com) [Flickr Groups (https://www.flickr.com)](https://www.flickr.com)*: top 100, photo* @@ -3157,21 +3157,22 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=https://paragraph.com) [Paragraph (https://paragraph.com)](https://paragraph.com)*: top 100M, blog, crypto* 1. ![](https://www.google.com/s2/favicons?domain=https://tonometerbot.com) [Tonometerbot (https://tonometerbot.com)](https://tonometerbot.com)*: top 100M, crypto* 1. ![](https://www.google.com/s2/favicons?domain=https://www.spatial.io) [Spatial (https://www.spatial.io)](https://www.spatial.io)*: top 100M, crypto, gaming* +1. ![](https://www.google.com/s2/favicons?domain=https://community.spotify.com) [SpotifyCommunity (https://community.spotify.com)](https://community.spotify.com)*: top 100M, forum, music* -The list was updated at (2026-04-06) +The list was updated at (2026-04-07) ## Statistics -Enabled/total sites: 2535/3154 = 80.37% +Enabled/total sites: 2537/3155 = 80.41% -Incomplete message checks: 334/2535 = 13.18% (false positive risks) +Incomplete message checks: 335/2537 = 13.2% (false positive risks) -Status code checks: 631/2535 = 24.89% (false positive risks) +Status code checks: 632/2537 = 24.91% (false positive risks) -False positive risk (total): 38.07% +False positive risk (total): 38.11% -Sites with probing: 500px, Armchairgm, BinarySearch (disabled), BleachFandom, Bluesky, BongaCams, Boosty, BuyMeACoffee, Calendly, Cent, Chess, Code Sandbox, Code Snippet Wiki, DailyMotion, Discord, Diskusjon.no, Disqus, Docker Hub, Duolingo, FandomCommunityCentral, GitHub, GitLab, Google Plus (archived), Gravatar, Hashnode, Holopin, Imgur, Issuu, Keybase, Kick, Kvinneguiden, LeetCode, Lesswrong, Livejasmin, LocalCryptos (disabled), MicrosoftLearn, MixCloud, Monkeytype, Niftygateway, Omg.lol, Paragraph, Picsart, Plurk, Polarsteps, Rarible, Reddit, Reddit Search (Pushshift) (disabled), RoyalCams, Scratch, Soop, SportsTracker, Spotify (disabled), StackOverflow, Substack, TAP'D, Topcoder, Trello, Twitch, Twitter, Twitter Shadowban (disabled), UnstoppableDomains, Vimeo, Warframe Market, Warpcast, Weibo, Yapisal (disabled), YouNow, en.brickimedia.org, nightbot, notabug.org, qiwi.me (disabled) +Sites with probing: 500px, Armchairgm, BinarySearch (disabled), BleachFandom, Bluesky, BongaCams, Boosty, BuyMeACoffee, Calendly, Cent, Chess, Code Sandbox, Code Snippet Wiki, DailyMotion, Discord, Diskusjon.no, Disqus, Docker Hub, Duolingo, FandomCommunityCentral, GitHub, GitLab, Google Plus (archived), Gravatar, Hashnode, Holopin, Imgur, Issuu, Keybase, Kick, Kvinneguiden, LeetCode, Lesswrong, Livejasmin, LocalCryptos (disabled), MicrosoftLearn, MixCloud, Monkeytype, Niftygateway, Omg.lol, Paragraph, Picsart, Plurk, Polarsteps, Rarible, Reddit, Reddit Search (Pushshift) (disabled), RoyalCams, Scratch, Soop, SportsTracker, Spotify, StackOverflow, Substack, TAP'D, Topcoder, Trello, Twitch, Twitter, Twitter Shadowban (disabled), UnstoppableDomains, Vimeo, Warframe Market, Warpcast, Weibo, Yapisal (disabled), YouNow, en.brickimedia.org, nightbot, notabug.org, qiwi.me (disabled) -Sites with activation: Spotify (disabled), Twitter, Vimeo, Weibo +Sites with activation: Twitter, Vimeo, Weibo Top 20 profile URLs: - (710) `{urlMain}/index/8-0-{username} (uCoz)` @@ -3198,7 +3199,7 @@ Top 20 profile URLs: Top 20 tags: - (1060) `NO_TAGS` (non-standard) -- (754) `forum` +- (755) `forum` - (127) `gaming` - (79) `coding` - (59) `photo` @@ -3206,7 +3207,7 @@ Top 20 tags: - (46) `tech` - (41) `news` - (39) `blog` -- (34) `music` +- (35) `music` - (32) `shopping` - (25) `sharing` - (25) `crypto`