From 3960510b6320a7d47e79b64a5c9c7850e255e0d9 Mon Sep 17 00:00:00 2001 From: Soxoj <31013580+soxoj@users.noreply.github.com> Date: Sun, 26 Apr 2026 12:34:52 +0200 Subject: [PATCH] Fix site checks: 7 fixed, 1 disabled (#2565) False-positive site probe issues #2531, #2542, #2556, #2559, #2560, #2561, #2563, #2496. --- maigret/resources/data.json | 50 +++++++++++++++++++++++++++++----- maigret/resources/db_meta.json | 4 +-- sites.md | 10 +++---- 3 files changed, 50 insertions(+), 14 deletions(-) diff --git a/maigret/resources/data.json b/maigret/resources/data.json index b089018..de82119 100644 --- a/maigret/resources/data.json +++ b/maigret/resources/data.json @@ -1335,12 +1335,17 @@ "usernameClaimed": "Blue", "usernameUnclaimed": "noonewouldeverusethis7", "alexaRank": 242, + "presenseStrs": [ + "class=\"gs_a\"" + ], "absenceStrs": [ "did not match any articles", "not match" ], "errors": { - "Our systems have detected unusual traffic": "Google rate-limit / captcha" + "Our systems have detected unusual traffic": "Google rate-limit / captcha", + "/sorry/index": "Google rate-limit / captcha", + "unusual traffic from your computer network": "Google rate-limit / captcha" }, "tags": [ "education", @@ -5462,7 +5467,13 @@ "tags": [ "gaming" ], - "checkType": "status_code", + "checkType": "message", + "presenseStrs": [ + "class=\"profile-container\"" + ], + "absenceStrs": [ + "request-error" + ], "alexaRank": 2067, "urlMain": "https://www.roblox.com/", "url": "https://www.roblox.com/user.aspx?username={username}", @@ -11389,7 +11400,17 @@ "tags": [ "us" ], - "checkType": "response_url", + "checkType": "message", + "presenseStrs": [ + "'s profile - Garden.org" + ], + "absenceStrs": [ + "Member List - Garden.org" + ], + "errors": { + "Just a moment": "Cloudflare challenge", + "challenges.cloudflare.com": "Cloudflare challenge" + }, "alexaRank": 17338, "urlMain": "https://garden.org", "url": "https://garden.org/users/profile/{username}/", @@ -13171,8 +13192,12 @@ "url": "https://hive.blog/@{username}", "urlMain": "https://hive.blog/", "checkType": "message", + "presenseStrs": [ + "class=\"UserProfile\"" + ], "absenceStrs": [ - "User Not Found - Hive" + "User Not Found - Hive", + "class=\"NotFound" ], "usernameClaimed": "mango-juice", "usernameUnclaimed": "noonewouldeverusethis7", @@ -14771,7 +14796,14 @@ "tags": [ "gaming" ], - "checkType": "response_url", + "checkType": "message", + "presenseStrs": [ + "class=\"profile-avatar\"" + ], + "errors": { + "Just a moment": "Cloudflare challenge", + "challenges.cloudflare.com": "Cloudflare challenge" + }, "alexaRank": 65342, "urlMain": "https://www.thesimsresource.com/", "url": "https://www.thesimsresource.com/members/{username}/", @@ -16774,8 +16806,8 @@ "ru" ], "checkType": "message", - "absenceStrs": [ - "Пользователь с таким именем не найден" + "presenseStrs": [ + "class=\"userprofile\"" ], "alexaRank": 160156, "urlMain": "https://www.rusfootball.info/", @@ -18596,6 +18628,9 @@ "us" ], "checkType": "message", + "presenseStrs": [ + "class=\"data_head\"" + ], "absenceStrs": [ "The user you requested does not exist, no matter how much you wish this might be the case." ], @@ -28554,6 +28589,7 @@ ] }, "TikTok Online Viewer": { + "disabled": true, "errors": { "Website unavailable": "Site error", "is currently offline": "Site error" diff --git a/maigret/resources/db_meta.json b/maigret/resources/db_meta.json index 335f0a1..914491b 100644 --- a/maigret/resources/db_meta.json +++ b/maigret/resources/db_meta.json @@ -1,8 +1,8 @@ { "version": 1, - "updated_at": "2026-04-26T09:18:14Z", + "updated_at": "2026-04-26T10:28:07Z", "sites_count": 3139, "min_maigret_version": "0.6.0", - "data_sha256": "c51ecaa6c0736c5e1e7ca91aaf111445b3ac9ce9541a472d97db2dcc3ff8aa17", + "data_sha256": "7a6e2e5d2d970d85a3c0b4ecc6eda34a927b6067bd75f2df0301d8603722428e", "data_url": "https://raw.githubusercontent.com/soxoj/maigret/main/maigret/resources/data.json" } \ No newline at end of file diff --git a/sites.md b/sites.md index 735c2e0..ede7df2 100644 --- a/sites.md +++ b/sites.md @@ -2402,7 +2402,7 @@ Rank data fetched from Majestic Million by domains. 1. ![](https://www.google.com/s2/favicons?domain=http://terminator-scc.net.ru) [Terminator (http://terminator-scc.net.ru)](http://terminator-scc.net.ru)*: top 100M, ru* 1. ![](https://www.google.com/s2/favicons?domain=https://www.thedaftclub.com) [Thedaftclub (https://www.thedaftclub.com)](https://www.thedaftclub.com)*: top 100M*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=https://www.thephysicsforum.com) [Thephysicsforum (https://www.thephysicsforum.com)](https://www.thephysicsforum.com)*: top 100M, forum*, search is disabled -1. ![](https://www.google.com/s2/favicons?domain=https://ttonlineviewer.com) [TikTok Online Viewer (https://ttonlineviewer.com)](https://ttonlineviewer.com)*: top 100M* +1. ![](https://www.google.com/s2/favicons?domain=https://ttonlineviewer.com) [TikTok Online Viewer (https://ttonlineviewer.com)](https://ttonlineviewer.com)*: top 100M*, search is disabled 1. ![](https://www.google.com/s2/favicons?domain=http://tkgr.ru/) [Tkgr (http://tkgr.ru/)](http://tkgr.ru/)*: top 100M, ru* 1. ![](https://www.google.com/s2/favicons?domain=https://torrent-soft.net) [Torrent-soft (https://torrent-soft.net)](https://torrent-soft.net)*: top 100M, ru* 1. ![](https://www.google.com/s2/favicons?domain=https://totalstavki.ru) [TotalStavki (https://totalstavki.ru)](https://totalstavki.ru)*: top 100M, ru*, search is disabled @@ -3146,13 +3146,13 @@ Rank data fetched from Majestic Million by domains. The list was updated at (2026-04-26) ## Statistics -Enabled/total sites: 2510/3139 = 79.96% +Enabled/total sites: 2509/3139 = 79.93% -Incomplete message checks: 317/2510 = 12.63% (false positive risks) +Incomplete message checks: 315/2509 = 12.55% (false positive risks) -Status code checks: 625/2510 = 24.9% (false positive risks) +Status code checks: 624/2509 = 24.87% (false positive risks) -False positive risk (total): 37.53% +False positive risk (total): 37.42% Sites with probing: 500px, Armchairgm, BinarySearch (disabled), BleachFandom, Bluesky, BongaCams, Boosty, BuyMeACoffee, Calendly, Cent, Chess, Code Sandbox, Code Snippet Wiki, DailyMotion, Discord, Diskusjon.no, Disqus, Docker Hub, Duolingo, FandomCommunityCentral, GitHub, GitLab, Google Plus (archived), Gravatar, HackTheBox, Hackerrank, Hashnode, Holopin, Imgur, Issuu, Keybase, Kick, Kvinneguiden, LeetCode, Lesswrong, Livejasmin, LocalCryptos (disabled), Medium, MicrosoftLearn, MixCloud, Monkeytype, NPM, Niftygateway, Omg.lol, OnlyFans, Paragraph, Picsart, Plurk, Polarsteps, Rarible, Reddit (disabled), Reddit Search (Pushshift) (disabled), Revolut.me, RoyalCams, Scratch, Soop, SportsTracker, Spotify, StackOverflow, Substack, TAP'D, Topcoder, Trello, Twitch, Twitter, Twitter Shadowban (disabled), UnstoppableDomains, Vimeo, Vivino, Warframe Market, Warpcast, Weibo, Wikipedia, Yapisal (disabled), YouNow, en.brickimedia.org, nightbot, notabug.org, qiwi.me (disabled)