diff --git a/maigret/resources/data.json b/maigret/resources/data.json index 12a55fe..5b49ca3 100644 --- a/maigret/resources/data.json +++ b/maigret/resources/data.json @@ -789,6 +789,7 @@ "checkType": "status_code", "urlMain": "https://scratch.mit.edu/", "url": "https://scratch.mit.edu/users/{username}", + "urlProbe": "https://api.scratch.mit.edu/users/{username}", "usernameClaimed": "griffpatch", "usernameUnclaimed": "noonewould" }, @@ -954,7 +955,8 @@ "The page you are looking for could not be found" ], "urlMain": "https://calendly.com", - "url": "https://calendly.com/{username}/15min", + "url": "https://calendly.com/{username}", + "urlProbe": "https://calendly.com/api/booking/profiles/{username}", "usernameClaimed": "john", "usernameUnclaimed": "noonewouldeverusethis7", "alexaRank": 149 @@ -1103,14 +1105,14 @@ ], "checkType": "message", "absenceStrs": [ - "Oops!", - "Unable to resolve handle" + "Profile not found" ], "presenseStrs": [ - ".bsky.social on Bluesky" + "\"did\"" ], "urlMain": "https://bsky.app", "url": "https://bsky.app/profile/{username}.bsky.social", + "urlProbe": "https://public.api.bsky.app/xrpc/app.bsky.actor.getProfile?actor={username}.bsky.social", "usernameClaimed": "shamerli", "usernameUnclaimed": "noonewouldeverusethis7", "alexaRank": 186 @@ -1220,29 +1222,13 @@ "tags": [ "video" ], - "checkType": "message", - "presenseStrs": [ - " style=", - "", - "og:title", - "Twitter", - "og:site_name" - ], + "checkType": "status_code", "alexaRank": 229, "urlMain": "https://www.dailymotion.com", "url": "https://www.dailymotion.com/{username}", + "urlProbe": "https://api.dailymotion.com/user/{username}?fields=id,username,screenname,description,avatar_720_url,cover_250_url,followers_total,following_total,videos_total,country,created_time,verified,url", "usernameClaimed": "blue", - "usernameUnclaimed": "rstnodkwzr", - "absenceStrs": [ - "Page not found", - "profile", - "error404", - "bodyall", - "No matches found" - ], - "headers": { - "User-Agent": "" - } + "usernameUnclaimed": "rstnodkwzr" }, "Bandcamp": { "tags": [ @@ -1767,9 +1753,13 @@ "Code Snippet Wiki": { "url": "https://codesnippets.fandom.com/wiki/User:{username}", "urlMain": "https://codesnippets.fandom.com", + "urlProbe": "https://codesnippets.fandom.com/api.php?action=query&list=users&ususers={username}&format=json", "checkType": "message", + "presenseStrs": [ + "\"userid\"" + ], "absenceStrs": [ - "This user has not filled out their profile page yet" + "\"missing\"" ], "usernameClaimed": "bob", "usernameUnclaimed": "noonewouldeverusethis7", diff --git a/sites.md b/sites.md index f4fd14f..9d16859 100644 --- a/sites.md +++ b/sites.md @@ -752,7 +752,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=https://tproger.ru) [Tproger (https://tproger.ru)](https://tproger.ru)*: top 10M, ru*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://www.gamblejoe.com) [Gamblejoe (https://www.gamblejoe.com)](https://www.gamblejoe.com)*: top 10M, de, mk, ua* 1. ![](https://www.google.com/s2/favicons?domain=https://massagerepublic.com) [massagerepublic.com (https://massagerepublic.com)](https://massagerepublic.com)*: top 10M* -1. ![](https://www.google.com/s2/favicons?domain=https://www.allthelyrics.com) [AllTheLyrics (https://www.allthelyrics.com)](https://www.allthelyrics.com)*: top 10M, forum, music* +1. ![](https://www.google.com/s2/favicons?domain=https://www.allthelyrics.com) [AllTheLyrics (https://www.allthelyrics.com)](https://www.allthelyrics.com)*: top 10M, forum, music*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://mama.ru) [Mama (https://mama.ru)](https://mama.ru)*: top 10M, ru*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://www.w7forums.com) [W7forums (https://www.w7forums.com)](https://www.w7forums.com)*: top 10M, forum* 1. ![](https://www.google.com/s2/favicons?domain=https://gvectors.com) [Gvectors (https://gvectors.com)](https://gvectors.com)*: top 10M, in, us* @@ -3263,19 +3263,19 @@ The list was updated at (2026-03-27) Enabled/total sites: 2632/3254 = 80.89% -Incomplete message checks: 344/2632 = 13.07% (false positive risks) +Incomplete message checks: 343/2632 = 13.03% (false positive risks) -Status code checks: 636/2632 = 24.16% (false positive risks) +Status code checks: 637/2632 = 24.2% (false positive risks) False positive risk (total): 37.23% -Sites with probing: 500px, Aparat (disabled), Armchairgm, BinarySearch (disabled), BleachFandom, BongaCams, BuyMeACoffee, Cent, Chess, Code Sandbox, Discord, Diskusjon.no, Disqus, Docker Hub, Duolingo, FandomCommunityCentral, Gab, GitHub, GitLab, Google Plus (archived), Gravatar, Holopin, Imgur, Issuu, Keybase, Kick, Kvinneguiden, Lesswrong, Livejasmin, LocalCryptos (disabled), MicrosoftLearn, MixCloud, Monkeytype, Niftygateway, Omg.lol, Picsart, Rarible, Reddit, Reddit Search (Pushshift) (disabled), RoyalCams, SOOP, SportsTracker, Spotify (disabled), Substack, TAP'D, Topcoder, Trello, Twitch, Twitter, Twitter Shadowban (disabled), UnstoppableDomains, Vimeo, Warframe Market, Weibo, Yapisal (disabled), YouNow, en.brickimedia.org, hashnode, nightbot, notabug.org, polarsteps, qiwi.me (disabled) +Sites with probing: 500px, Aparat (disabled), Armchairgm, BinarySearch (disabled), BleachFandom, Bluesky, BongaCams, BuyMeACoffee, Cent, Chess, Code Sandbox, Code Snippet Wiki, DailyMotion, Discord, Diskusjon.no, Disqus, Docker Hub, Duolingo, FandomCommunityCentral, Gab, GitHub, GitLab, Google Plus (archived), Gravatar, Holopin, Imgur, Issuu, Keybase, Kick, Kvinneguiden, Lesswrong, Livejasmin, LocalCryptos (disabled), MicrosoftLearn, MixCloud, Monkeytype, Niftygateway, Omg.lol, Picsart, Rarible, Reddit, Reddit Search (Pushshift) (disabled), RoyalCams, SOOP, Scratch, SportsTracker, Spotify (disabled), Substack, TAP'D, Topcoder, Trello, Twitch, Twitter, Twitter Shadowban (disabled), UnstoppableDomains, Vimeo, Warframe Market, Weibo, Yapisal (disabled), YouNow, calendly.com, en.brickimedia.org, hashnode, nightbot, notabug.org, polarsteps, qiwi.me (disabled) Sites with activation: Spotify (disabled), Twitter, Vimeo, Weibo Top 20 profile URLs: - (796) `{urlMain}/index/8-0-{username} (uCoz)` -- (321) `/{username}` +- (322) `/{username}` - (221) `{urlMain}{urlSubpath}/members/?username={username} (XenForo)` - (173) `/user/{username}` - (139) `/profile/{username}`