diff --git a/.githooks/pre-commit b/.githooks/pre-commit index 7a9bbe1..8d88963 100755 --- a/.githooks/pre-commit +++ b/.githooks/pre-commit @@ -4,4 +4,7 @@ poetry run update_sitesmd echo 'Regenerating db_meta.json...' python3 utils/generate_db_meta.py -git add maigret/resources/db_meta.json \ No newline at end of file + +git add maigret/resources/db_meta.json +git add maigret/resources/data.json +git add sites.md diff --git a/maigret/resources/data.json b/maigret/resources/data.json index 4f2a019..1f39a9d 100644 --- a/maigret/resources/data.json +++ b/maigret/resources/data.json @@ -371,7 +371,8 @@ "urlMain": "https://bit.ly", "url": "https://bit.ly/{username}", "usernameClaimed": "john", - "usernameUnclaimed": "noonewouldeverusethis7" + "usernameUnclaimed": "noonewouldeverusethis7", + "disabled": true }, "WordPress": { "tags": [ @@ -1354,7 +1355,8 @@ "tags": [ "education", "research" - ] + ], + "similarSearch": true }, "GoodReads": { "tags": [ @@ -11177,7 +11179,14 @@ "urlMain": "https://boards.theforce.net", "engine": "XenForo", "usernameClaimed": "alex", - "usernameUnclaimed": "noonewouldeverusethis7" + "usernameUnclaimed": "noonewouldeverusethis7", + "disabled": true, + "errors": { + "Log in | Jedi Council": "Login required" + }, + "protection": [ + "login" + ] }, "Akniga": { "tags": [ @@ -12182,7 +12191,11 @@ "usernameUnclaimed": "noonewouldeverusethis7", "protection": [ "ip_reputation" - ] + ], + "disabled": true, + "errors": { + "Just a moment": "Cloudflare challenge" + } }, "discuss.inventables.com": { "urlMain": "https://discuss.inventables.com", @@ -19622,7 +19635,8 @@ "urlMain": "https://www.firearmstalk.com", "url": "https://www.firearmstalk.com/members/?username={username}", "usernameClaimed": "adam", - "usernameUnclaimed": "noonewouldeverusethis7" + "usernameUnclaimed": "noonewouldeverusethis7", + "disabled": true }, "Dissenter": { "tags": [ @@ -23186,7 +23200,8 @@ "urlMain": "http://forum.trade-print.ru", "engine": "vBulletin", "usernameClaimed": "alex", - "usernameUnclaimed": "noonewouldeverusethis7" + "usernameUnclaimed": "noonewouldeverusethis7", + "disabled": true }, "red-forum.com": { "urlMain": "https://red-forum.com", @@ -26850,7 +26865,14 @@ "checkType": "status_code", "url": "https://www.needrom.com/author/{username}/", "usernameClaimed": "needrom", - "usernameUnclaimed": "noonewouldeverusethis7" + "usernameUnclaimed": "noonewouldeverusethis7", + "disabled": true, + "protection": [ + "js_challenge" + ], + "errors": { + "Just a moment": "Cloudflare challenge" + } }, "No-jus": { "tags": [ @@ -32921,12 +32943,6 @@ "usernameUnclaimed": "noonewouldeverusethis7", "url": "https://discuss.pytorch.org/u/{username}" }, - "discussion.dreamhost.com": { - "checkType": "status_code", - "usernameClaimed": "adam", - "usernameUnclaimed": "noonewouldeverusethis7", - "url": "https://discussion.dreamhost.com/u/{username}" - }, "dnd-wiki.org": { "checkType": "status_code", "usernameClaimed": "adam", @@ -32946,14 +32962,20 @@ "url": "https://elixirforum.com/u/{username}" }, "en.brickimedia.org": { - "checkType": "message", - "usernameClaimed": "adam", - "usernameUnclaimed": "noonewouldeverusethis7", "url": "https://en.brickimedia.org/wiki/User:{username}", - "urlMain": "https://en.brickimedia.org", "urlProbe": "https://en.brickimedia.org/w/api.php?action=query&list=users&ususers={username}&format=json", + "urlMain": "https://en.brickimedia.org", + "checkType": "message", + "presenseStrs": [ + "\"userid\"" + ], "absenceStrs": [ "\"missing\"" + ], + "usernameClaimed": "Lcawte", + "usernameUnclaimed": "noonewouldeverusethis7", + "tags": [ + "wiki" ] }, "en.illogicopedia.org": { @@ -33477,12 +33499,6 @@ "usernameUnclaimed": "noonewouldeverusethis7", "url": "https://premium.chat/{username}" }, - "profile.typepad.com": { - "checkType": "status_code", - "usernameClaimed": "adam", - "usernameUnclaimed": "noonewouldeverusethis7", - "url": "https://profile.typepad.com/{username}" - }, "pttweb.cc": { "checkType": "status_code", "usernameClaimed": "adam", diff --git a/maigret/resources/db_meta.json b/maigret/resources/db_meta.json index 9fe5125..def26cc 100644 --- a/maigret/resources/db_meta.json +++ b/maigret/resources/db_meta.json @@ -1,8 +1,8 @@ { "version": 1, - "updated_at": "2026-04-04T16:16:31Z", - "sites_count": 3157, + "updated_at": "2026-04-04T17:04:45Z", + "sites_count": 3155, "min_maigret_version": "0.5.0", - "data_sha256": "7c8d51c45100ef0a26c401ee26ffb83ee5b7c897011502ded8d9ae161c8ed751", + "data_sha256": "4b1c0c96e1595f6e83584a7a6e885647095cbfb7f23c938d7440f8a3408551b1", "data_url": "https://raw.githubusercontent.com/soxoj/maigret/main/maigret/resources/data.json" } \ No newline at end of file diff --git a/sites.md b/sites.md index 574bce4..cd45e11 100644 --- a/sites.md +++ b/sites.md @@ -1,5 +1,5 @@ -## List of supported sites (search methods): total 3157 +## List of supported sites (search methods): total 3155 Rank data fetched from Majestic Million by domains. @@ -18,7 +18,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=https://vimeo.com) [Vimeo (https://vimeo.com)](https://vimeo.com)*: top 50, video* 1. ![](https://www.google.com/s2/favicons?domain=https://www.tiktok.com/) [TikTok (https://www.tiktok.com/)](https://www.tiktok.com/)*: top 50, social, video* 1. ![](https://www.google.com/s2/favicons?domain=https://amazon.com) [Amazon (https://amazon.com)](https://amazon.com)*: top 50, shopping, us* -1. ![](https://www.google.com/s2/favicons?domain=https://bit.ly) [Bit.ly (https://bit.ly)](https://bit.ly)*: top 50, links* +1. ![](https://www.google.com/s2/favicons?domain=https://bit.ly) [Bit.ly (https://bit.ly)](https://bit.ly)*: top 50, links*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://wordpress.com) [WordPress (https://wordpress.com)](https://wordpress.com)*: top 50, blog* 1. ![](https://www.google.com/s2/favicons?domain=https://plus.google.com) [Google Plus (archived) (https://plus.google.com)](https://plus.google.com)*: top 50, social* 1. ![](https://www.google.com/s2/favicons?domain=https://t.me/) [Telegram (https://t.me/)](https://t.me/)*: top 50, messaging* @@ -505,7 +505,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=http://lurkmore.to) [Lurkmore (http://lurkmore.to)](http://lurkmore.to)*: top 100K, ru* 1. ![](https://www.google.com/s2/favicons?domain=https://uid.me/) [uID.me (by username) (https://uid.me/)](https://uid.me/)*: top 100K, ru* 1. ![](https://www.google.com/s2/favicons?domain=https://uid.me/) [uID.me (by uguid) (https://uid.me/)](https://uid.me/)*: top 100K, ru* -1. ![](https://www.google.com/s2/favicons?domain=https://www.travelblog.org) [Travelblog (https://www.travelblog.org)](https://www.travelblog.org)*: top 100K, blog, travel* +1. ![](https://www.google.com/s2/favicons?domain=https://www.travelblog.org) [Travelblog (https://www.travelblog.org)](https://www.travelblog.org)*: top 100K, blog, travel*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://xakep.ru) [xakep.ru (https://xakep.ru)](https://xakep.ru)*: top 100K, ru* 1. ![](https://www.google.com/s2/favicons?domain=https://dou.ua/) [Dou (https://dou.ua/)](https://dou.ua/)*: top 100K, ua* 1. ![](https://www.google.com/s2/favicons?domain=https://www.hr.com) [Hr (https://www.hr.com)](https://www.hr.com)*: top 100K, career* @@ -935,7 +935,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=https://ghisler.ch/board) [ghisler.ch (https://ghisler.ch/board)](https://ghisler.ch/board)*: top 10M, forum* 1. ![](https://www.google.com/s2/favicons?domain=https://www.magix.info) [Magix (https://www.magix.info)](https://www.magix.info)*: top 10M, tech*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://gpodder.net/) [Gpodder (https://gpodder.net/)](https://gpodder.net/)*: top 10M, music* -1. ![](https://www.google.com/s2/favicons?domain=https://www.firearmstalk.com) [Firearmstalk (https://www.firearmstalk.com)](https://www.firearmstalk.com)*: top 10M, us* +1. ![](https://www.google.com/s2/favicons?domain=https://www.firearmstalk.com) [Firearmstalk (https://www.firearmstalk.com)](https://www.firearmstalk.com)*: top 10M, us*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://dissenter.com/) [Dissenter (https://dissenter.com/)](https://dissenter.com/)*: top 10M, us* 1. ![](https://www.google.com/s2/favicons?domain=https://www.autolada.ru/) [Autolada (https://www.autolada.ru/)](https://www.autolada.ru/)*: top 10M, ru* 1. ![](https://www.google.com/s2/favicons?domain=https://www.russpuss.ru) [russpuss.ru (https://www.russpuss.ru)](https://www.russpuss.ru)*: top 10M, erotic, forum, ru* @@ -1765,7 +1765,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=https://forums.alliedmods.net/) [alliedmods (https://forums.alliedmods.net/)](https://forums.alliedmods.net/)*: top 100M, forum, gb, jp, tr, uz*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://forums.gamerevolution.com) [GameRevolution (https://forums.gamerevolution.com)](https://forums.gamerevolution.com)*: top 100M, forum, gaming* 1. ![](https://www.google.com/s2/favicons?domain=https://ru.pathofexile.com) [Pathofexile (https://ru.pathofexile.com)](https://ru.pathofexile.com)*: top 100M, ru* -1. ![](https://www.google.com/s2/favicons?domain=https://boards.theforce.net) [boards.theforce.net (https://boards.theforce.net)](https://boards.theforce.net)*: top 100M* +1. ![](https://www.google.com/s2/favicons?domain=https://boards.theforce.net) [boards.theforce.net (https://boards.theforce.net)](https://boards.theforce.net)*: top 100M*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://community.justlanded.com) [Justlanded (https://community.justlanded.com)](https://community.justlanded.com)*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=http://forum.igromania.ru/) [igromania (http://forum.igromania.ru/)](http://forum.igromania.ru/)*: top 100M, forum, gaming, ru* 1. ![](https://www.google.com/s2/favicons?domain=http://forum.lingvolive.com) [Lingvolive (http://forum.lingvolive.com)](http://forum.lingvolive.com)*: top 100M, de, forum, it, ru*, search is disabled @@ -1988,7 +1988,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=https://forum.freeton.org) [forum.freeton.org (https://forum.freeton.org)](https://forum.freeton.org)*: top 100M, finance, forum*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=http://forum.ua-vet.com) [forum.ua-vet.com (http://forum.ua-vet.com)](http://forum.ua-vet.com)*: top 100M, forum* 1. ![](https://www.google.com/s2/favicons?domain=https://sst.hiberworld.com/user/{username}) [sst.hiberworld.com (https://sst.hiberworld.com/user/{username})](https://sst.hiberworld.com/user/{username})*: top 100M* -1. ![](https://www.google.com/s2/favicons?domain=http://forum.trade-print.ru) [forum.trade-print.ru (http://forum.trade-print.ru)](http://forum.trade-print.ru)*: top 100M* +1. ![](https://www.google.com/s2/favicons?domain=http://forum.trade-print.ru) [forum.trade-print.ru (http://forum.trade-print.ru)](http://forum.trade-print.ru)*: top 100M*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=http://0-3.ru) [0-3.RU (http://0-3.ru)](http://0-3.ru)*: top 100M, forum, ru* 1. ![](https://www.google.com/s2/favicons?domain=) [discussions.ubisoft.com ()]()*: top 100M, forum, gaming* 1. ![](https://www.google.com/s2/favicons?domain=http://1001mem.ru) [1001mem.ru (http://1001mem.ru)](http://1001mem.ru)*: top 100M, ru* @@ -2290,7 +2290,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=) [Ninjakiwi ()]()*: top 100M*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://www.nationalgunforum.com) [NationalgunForum (https://www.nationalgunforum.com)](https://www.nationalgunforum.com)*: top 100M, ca, forum*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://naturalworld.guru) [Naturalworld (https://naturalworld.guru)](https://naturalworld.guru)*: top 100M, ru* -1. ![](https://www.google.com/s2/favicons?domain=) [Needrom ()]()*: top 100M* +1. ![](https://www.google.com/s2/favicons?domain=) [Needrom ()]()*: top 100M*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://no-jus.com) [No-jus (https://no-jus.com)](https://no-jus.com)*: top 100M, ru*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://numizmat-forum.ru) [Numizmat (https://numizmat-forum.ru)](https://numizmat-forum.ru)*: top 100M, forum, ru* 1. ![](https://www.google.com/s2/favicons?domain=) [Nyaa.si ()]()*: top 100M* @@ -2933,11 +2933,10 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=) [discuss.pixls.us ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [discuss.prosemirror.net ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [discuss.pytorch.org ()]()*: top 100M* -1. ![](https://www.google.com/s2/favicons?domain=) [discussion.dreamhost.com ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [dnd-wiki.org ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [dogcraft.net ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [elixirforum.com ()]()*: top 100M* -1. ![](https://www.google.com/s2/favicons?domain=https://en.brickimedia.org) [en.brickimedia.org (https://en.brickimedia.org)](https://en.brickimedia.org)*: top 100M* +1. ![](https://www.google.com/s2/favicons?domain=https://en.brickimedia.org) [en.brickimedia.org (https://en.brickimedia.org)](https://en.brickimedia.org)*: top 100M, wiki* 1. ![](https://www.google.com/s2/favicons?domain=) [en.illogicopedia.org ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [en.uncyclopedia.co ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [en.wikifur.com ()]()*: top 100M* @@ -3018,7 +3017,6 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=) [pinataisland.info ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [postcrossing.com ()]()*: top 100M*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=) [premium.chat ()]()*: top 100M* -1. ![](https://www.google.com/s2/favicons?domain=) [profile.typepad.com ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [pttweb.cc ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [qiita.com ()]()*: top 100M* 1. ![](https://www.google.com/s2/favicons?domain=) [rationalwiki.org ()]()*: top 100M* @@ -3164,13 +3162,13 @@ Rank data fetched from Majestic Million by domains. The list was updated at (2026-04-04) ## Statistics -Enabled/total sites: 2546/3157 = 80.65% +Enabled/total sites: 2538/3155 = 80.44% -Incomplete message checks: 341/2546 = 13.39% (false positive risks) +Incomplete message checks: 338/2538 = 13.32% (false positive risks) -Status code checks: 636/2546 = 24.98% (false positive risks) +Status code checks: 631/2538 = 24.86% (false positive risks) -False positive risk (total): 38.37% +False positive risk (total): 38.18% Sites with probing: 500px, Armchairgm, BinarySearch (disabled), BleachFandom, Bluesky, BongaCams, Boosty, BuyMeACoffee, Calendly, Cent, Chess, Code Sandbox, Code Snippet Wiki, DailyMotion, Discord, Diskusjon.no, Disqus, Docker Hub, Duolingo, FandomCommunityCentral, GitHub, GitLab, Google Plus (archived), Gravatar, Hashnode, Holopin, Imgur, Issuu, Keybase, Kick, Kvinneguiden, LeetCode, Lesswrong, Livejasmin, LocalCryptos (disabled), MicrosoftLearn, MixCloud, Monkeytype, Niftygateway, Omg.lol, Paragraph, Picsart, Plurk, Polarsteps, Rarible, Reddit, Reddit Search (Pushshift) (disabled), RoyalCams, Scratch, Soop, SportsTracker, Spotify (disabled), StackOverflow, Substack, TAP'D, Topcoder, Trello, Twitch, Twitter, Twitter Shadowban (disabled), UnstoppableDomains, Vimeo, Warframe Market, Warpcast, Weibo, Yapisal (disabled), YouNow, en.brickimedia.org, nightbot, notabug.org, qiwi.me (disabled) @@ -3178,13 +3176,13 @@ Sites with activation: Spotify (disabled), Twitter, Vimeo, Weibo Top 20 profile URLs: - (710) `{urlMain}/index/8-0-{username} (uCoz)` -- (319) `/{username}` +- (318) `/{username}` - (221) `{urlMain}{urlSubpath}/members/?username={username} (XenForo)` - (173) `/user/{username}` - (138) `/profile/{username}` - (131) `{urlMain}{urlSubpath}/member.php?username={username} (vBulletin)` - (127) `{urlMain}{urlSubpath}/search.php?author={username} (phpBB/Search)` -- (118) `/u/{username}` +- (117) `/u/{username}` - (92) `/users/{username}` - (87) `{urlMain}/u/{username}/summary (Discourse)` - (68) `/@{username}` @@ -3200,7 +3198,7 @@ Top 20 profile URLs: Top 20 tags: -- (1063) `NO_TAGS` (non-standard) +- (1060) `NO_TAGS` (non-standard) - (754) `forum` - (127) `gaming` - (79) `coding`