mirror of
https://github.com/soxoj/maigret.git
synced 2026-05-06 14:08:59 +00:00
Fix false positives (#2459)
* Fix false positives: APClips, Taplink, gentoo, Discord.bio, ChaturBate; disable 7Cups, playtime, openriskmanual, reactos; update tags * Fix db_meta.json regeneration in update_site_data.py (inline instead of module import)
This commit is contained in:
+57
-32
@@ -5799,26 +5799,20 @@
|
|||||||
"alexaRank": 2741
|
"alexaRank": 2741
|
||||||
},
|
},
|
||||||
"Taplink": {
|
"Taplink": {
|
||||||
"tags": [
|
|
||||||
"links",
|
|
||||||
"ru"
|
|
||||||
],
|
|
||||||
"headers": {
|
|
||||||
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
|
|
||||||
},
|
|
||||||
"checkType": "message",
|
|
||||||
"absenceStrs": [
|
|
||||||
"Page not found",
|
|
||||||
"Страница не найдена"
|
|
||||||
],
|
|
||||||
"presenseStrs": [
|
|
||||||
"taplink.cc"
|
|
||||||
],
|
|
||||||
"urlMain": "https://taplink.cc/",
|
|
||||||
"url": "https://taplink.cc/{username}",
|
"url": "https://taplink.cc/{username}",
|
||||||
"usernameClaimed": "taplink.ru",
|
"urlMain": "https://taplink.cc/",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis77777",
|
"checkType": "message",
|
||||||
"alexaRank": 4798
|
"presenseStrs": [
|
||||||
|
"at Taplink"
|
||||||
|
],
|
||||||
|
"usernameClaimed": "adidas",
|
||||||
|
"usernameUnclaimed": "noonewouldeverusethis7",
|
||||||
|
"tags": [
|
||||||
|
"links"
|
||||||
|
],
|
||||||
|
"protection": [
|
||||||
|
"tls_fingerprint"
|
||||||
|
]
|
||||||
},
|
},
|
||||||
"MetaDiscourse": {
|
"MetaDiscourse": {
|
||||||
"tags": [
|
"tags": [
|
||||||
@@ -5990,12 +5984,12 @@
|
|||||||
},
|
},
|
||||||
"gentoo": {
|
"gentoo": {
|
||||||
"tags": [
|
"tags": [
|
||||||
"fi",
|
"coding",
|
||||||
"forum"
|
"forum"
|
||||||
],
|
],
|
||||||
"checkType": "message",
|
"checkType": "message",
|
||||||
"absenceStrs": [
|
"absenceStrs": [
|
||||||
"title>Gentoo Forums :: </title>"
|
"Error 404 (Not Found)"
|
||||||
],
|
],
|
||||||
"urlMain": "https://forums.gentoo.org",
|
"urlMain": "https://forums.gentoo.org",
|
||||||
"url": "https://forums.gentoo.org/profile.php?mode=viewprofile&u={username}",
|
"url": "https://forums.gentoo.org/profile.php?mode=viewprofile&u={username}",
|
||||||
@@ -6221,14 +6215,21 @@
|
|||||||
},
|
},
|
||||||
"ChaturBate": {
|
"ChaturBate": {
|
||||||
"tags": [
|
"tags": [
|
||||||
|
"porn",
|
||||||
"webcam"
|
"webcam"
|
||||||
],
|
],
|
||||||
"checkType": "status_code",
|
"checkType": "status_code",
|
||||||
"alexaRank": 3165,
|
"alexaRank": 3165,
|
||||||
"urlMain": "https://chaturbate.com",
|
"urlMain": "https://chaturbate.com",
|
||||||
"url": "https://chaturbate.com/{username}",
|
"url": "https://chaturbate.com/{username}/",
|
||||||
"usernameClaimed": "cute18cute",
|
"usernameClaimed": "cute18cute",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis77777"
|
"usernameUnclaimed": "noonewouldeverusethis77777",
|
||||||
|
"presenseStrs": [
|
||||||
|
"\"broadcaster_username\""
|
||||||
|
],
|
||||||
|
"absenceStrs": [
|
||||||
|
"<title>Chaturbate"
|
||||||
|
]
|
||||||
},
|
},
|
||||||
"Techdirt": {
|
"Techdirt": {
|
||||||
"disabled": true,
|
"disabled": true,
|
||||||
@@ -12178,7 +12179,10 @@
|
|||||||
"urlMain": "https://www.travelblog.org",
|
"urlMain": "https://www.travelblog.org",
|
||||||
"url": "https://www.travelblog.org/Bloggers/{username}",
|
"url": "https://www.travelblog.org/Bloggers/{username}",
|
||||||
"usernameClaimed": "adam",
|
"usernameClaimed": "adam",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis7"
|
"usernameUnclaimed": "noonewouldeverusethis7",
|
||||||
|
"protection": [
|
||||||
|
"ip_reputation"
|
||||||
|
]
|
||||||
},
|
},
|
||||||
"discuss.inventables.com": {
|
"discuss.inventables.com": {
|
||||||
"urlMain": "https://discuss.inventables.com",
|
"urlMain": "https://discuss.inventables.com",
|
||||||
@@ -13298,7 +13302,8 @@
|
|||||||
"urlMain": "https://www.7cups.com/",
|
"urlMain": "https://www.7cups.com/",
|
||||||
"url": "https://www.7cups.com/@{username}",
|
"url": "https://www.7cups.com/@{username}",
|
||||||
"usernameClaimed": "blue",
|
"usernameClaimed": "blue",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis7"
|
"usernameUnclaimed": "noonewouldeverusethis7",
|
||||||
|
"disabled": true
|
||||||
},
|
},
|
||||||
"hi-news.ru": {
|
"hi-news.ru": {
|
||||||
"tags": [
|
"tags": [
|
||||||
@@ -21362,9 +21367,13 @@
|
|||||||
"usernameClaimed": "onlybbyraq",
|
"usernameClaimed": "onlybbyraq",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis7",
|
"usernameUnclaimed": "noonewouldeverusethis7",
|
||||||
"tags": [
|
"tags": [
|
||||||
|
"porn",
|
||||||
"video"
|
"video"
|
||||||
],
|
],
|
||||||
"alexaRank": 557429
|
"alexaRank": 557429,
|
||||||
|
"protection": [
|
||||||
|
"tls_fingerprint"
|
||||||
|
]
|
||||||
},
|
},
|
||||||
"Politikforum": {
|
"Politikforum": {
|
||||||
"tags": [
|
"tags": [
|
||||||
@@ -29469,7 +29478,8 @@
|
|||||||
"playtime": {
|
"playtime": {
|
||||||
"tags": [
|
"tags": [
|
||||||
"de",
|
"de",
|
||||||
"forum"
|
"forum",
|
||||||
|
"gaming"
|
||||||
],
|
],
|
||||||
"checkType": "message",
|
"checkType": "message",
|
||||||
"absenceStrs": [
|
"absenceStrs": [
|
||||||
@@ -29478,7 +29488,8 @@
|
|||||||
"urlMain": "https://forum.playtime-forum.info",
|
"urlMain": "https://forum.playtime-forum.info",
|
||||||
"url": "https://forum.playtime-forum.info/members/?username={username}",
|
"url": "https://forum.playtime-forum.info/members/?username={username}",
|
||||||
"usernameClaimed": "Glumbi",
|
"usernameClaimed": "Glumbi",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis7"
|
"usernameUnclaimed": "noonewouldeverusethis7",
|
||||||
|
"disabled": true
|
||||||
},
|
},
|
||||||
"privateinvestor2000.com": {
|
"privateinvestor2000.com": {
|
||||||
"engine": "uCoz",
|
"engine": "uCoz",
|
||||||
@@ -33398,7 +33409,12 @@
|
|||||||
"checkType": "status_code",
|
"checkType": "status_code",
|
||||||
"usernameClaimed": "test",
|
"usernameClaimed": "test",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis7",
|
"usernameUnclaimed": "noonewouldeverusethis7",
|
||||||
"url": "https://openriskmanual.org/wiki/User:{username}"
|
"url": "https://openriskmanual.org/wiki/User:{username}",
|
||||||
|
"disabled": true,
|
||||||
|
"tags": [
|
||||||
|
"finance",
|
||||||
|
"wiki"
|
||||||
|
]
|
||||||
},
|
},
|
||||||
"openwetware.org": {
|
"openwetware.org": {
|
||||||
"checkType": "status_code",
|
"checkType": "status_code",
|
||||||
@@ -33495,7 +33511,12 @@
|
|||||||
"checkType": "status_code",
|
"checkType": "status_code",
|
||||||
"usernameClaimed": "admin",
|
"usernameClaimed": "admin",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis7",
|
"usernameUnclaimed": "noonewouldeverusethis7",
|
||||||
"url": "https://reactos.org/wiki/User:{username}"
|
"url": "https://reactos.org/wiki/User:{username}",
|
||||||
|
"disabled": true,
|
||||||
|
"tags": [
|
||||||
|
"coding",
|
||||||
|
"wiki"
|
||||||
|
]
|
||||||
},
|
},
|
||||||
"realcty.org": {
|
"realcty.org": {
|
||||||
"checkType": "status_code",
|
"checkType": "status_code",
|
||||||
@@ -34903,10 +34924,14 @@
|
|||||||
"urlMain": "https://discord.bio/",
|
"urlMain": "https://discord.bio/",
|
||||||
"checkType": "message",
|
"checkType": "message",
|
||||||
"absenceStrs": [
|
"absenceStrs": [
|
||||||
"<title>Server Error (500)</title>"
|
"User not found"
|
||||||
],
|
],
|
||||||
"usernameClaimed": "robert",
|
"usernameClaimed": "robert",
|
||||||
"usernameUnclaimed": "noonewouldeverusethis7"
|
"usernameUnclaimed": "noonewouldeverusethis7",
|
||||||
|
"tags": [
|
||||||
|
"gaming",
|
||||||
|
"social"
|
||||||
|
]
|
||||||
},
|
},
|
||||||
"Hacker Sploit": {
|
"Hacker Sploit": {
|
||||||
"url": "https://forum.hackersploit.org/u/{username}",
|
"url": "https://forum.hackersploit.org/u/{username}",
|
||||||
|
|||||||
@@ -1,8 +1,8 @@
|
|||||||
{
|
{
|
||||||
"version": 1,
|
"version": 1,
|
||||||
"updated_at": "2026-04-04T15:54:23Z",
|
"updated_at": "2026-04-04T16:16:31Z",
|
||||||
"sites_count": 3157,
|
"sites_count": 3157,
|
||||||
"min_maigret_version": "0.5.0",
|
"min_maigret_version": "0.5.0",
|
||||||
"data_sha256": "880a56363cf5d71e13ca389330388fbc4796bff50d6e207a056112c4a5606f83",
|
"data_sha256": "7c8d51c45100ef0a26c401ee26ffb83ee5b7c897011502ded8d9ae161c8ed751",
|
||||||
"data_url": "https://raw.githubusercontent.com/soxoj/maigret/main/maigret/resources/data.json"
|
"data_url": "https://raw.githubusercontent.com/soxoj/maigret/main/maigret/resources/data.json"
|
||||||
}
|
}
|
||||||
@@ -249,7 +249,7 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [Mix (https://mix.com)](https://mix.com)*: top 5K, links, sharing*
|
1.  [Mix (https://mix.com)](https://mix.com)*: top 5K, links, sharing*
|
||||||
1.  [Chess (https://www.chess.com)](https://www.chess.com)*: top 5K, gaming, hobby*
|
1.  [Chess (https://www.chess.com)](https://www.chess.com)*: top 5K, gaming, hobby*
|
||||||
1.  [OpenCollective (https://opencollective.com/)](https://opencollective.com/)*: top 5K, coding, finance*
|
1.  [OpenCollective (https://opencollective.com/)](https://opencollective.com/)*: top 5K, coding, finance*
|
||||||
1.  [ChaturBate (https://chaturbate.com)](https://chaturbate.com)*: top 5K, webcam*
|
1.  [ChaturBate (https://chaturbate.com)](https://chaturbate.com)*: top 5K, porn, webcam*
|
||||||
1.  [Techdirt (https://www.techdirt.com/)](https://www.techdirt.com/)*: top 5K, news, tech*, search is disabled
|
1.  [Techdirt (https://www.techdirt.com/)](https://www.techdirt.com/)*: top 5K, news, tech*, search is disabled
|
||||||
1.  [jAlbum.net (https://jalbum.net)](https://jalbum.net)*: top 5K, photo*
|
1.  [jAlbum.net (https://jalbum.net)](https://jalbum.net)*: top 5K, photo*
|
||||||
1.  [Ultimate-Guitar (https://ultimate-guitar.com/)](https://ultimate-guitar.com/)*: top 5K, music*
|
1.  [Ultimate-Guitar (https://ultimate-guitar.com/)](https://ultimate-guitar.com/)*: top 5K, music*
|
||||||
@@ -277,7 +277,6 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [AlternativeTo (https://alternativeto.net/)](https://alternativeto.net/)*: top 5K, tech*
|
1.  [AlternativeTo (https://alternativeto.net/)](https://alternativeto.net/)*: top 5K, tech*
|
||||||
1.  [PeriscopeTv (https://www.pscp.tv)](https://www.pscp.tv)*: top 5K, streaming, video*
|
1.  [PeriscopeTv (https://www.pscp.tv)](https://www.pscp.tv)*: top 5K, streaming, video*
|
||||||
1.  [Pikabu (https://pikabu.ru/)](https://pikabu.ru/)*: top 5K, ru, sharing, social*
|
1.  [Pikabu (https://pikabu.ru/)](https://pikabu.ru/)*: top 5K, ru, sharing, social*
|
||||||
1.  [Taplink (https://taplink.cc/)](https://taplink.cc/)*: top 5K, links, ru*
|
|
||||||
1.  [Lichess (https://lichess.org)](https://lichess.org)*: top 5K, gaming, hobby*
|
1.  [Lichess (https://lichess.org)](https://lichess.org)*: top 5K, gaming, hobby*
|
||||||
1.  [Speedrun.com (https://speedrun.com/)](https://speedrun.com/)*: top 5K, gaming*
|
1.  [Speedrun.com (https://speedrun.com/)](https://speedrun.com/)*: top 5K, gaming*
|
||||||
1.  [F6S (https://f6s.com/)](https://f6s.com/)*: top 5K, business*
|
1.  [F6S (https://f6s.com/)](https://f6s.com/)*: top 5K, business*
|
||||||
@@ -572,7 +571,7 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [Fredmiranda (https://www.fredmiranda.com)](https://www.fredmiranda.com)*: top 100K, de*
|
1.  [Fredmiranda (https://www.fredmiranda.com)](https://www.fredmiranda.com)*: top 100K, de*
|
||||||
1.  [Skyblock (https://skyblock.net)](https://skyblock.net)*: top 100K, forum, gaming*
|
1.  [Skyblock (https://skyblock.net)](https://skyblock.net)*: top 100K, forum, gaming*
|
||||||
1.  [joyreactor.cc (http://joyreactor.cc)](http://joyreactor.cc)*: top 100K, art, nl, ru*
|
1.  [joyreactor.cc (http://joyreactor.cc)](http://joyreactor.cc)*: top 100K, art, nl, ru*
|
||||||
1.  [7Cups (https://www.7cups.com/)](https://www.7cups.com/)*: top 100K, medicine*
|
1.  [7Cups (https://www.7cups.com/)](https://www.7cups.com/)*: top 100K, medicine*, search is disabled
|
||||||
1.  [hi-news.ru (https://hi-news.ru)](https://hi-news.ru)*: top 100K, ru*
|
1.  [hi-news.ru (https://hi-news.ru)](https://hi-news.ru)*: top 100K, ru*
|
||||||
1.  [BabyBlog.ru (https://www.babyblog.ru/)](https://www.babyblog.ru/)*: top 100K, ru*
|
1.  [BabyBlog.ru (https://www.babyblog.ru/)](https://www.babyblog.ru/)*: top 100K, ru*
|
||||||
1.  [ViewBug (https://www.viewbug.com)](https://www.viewbug.com)*: top 100K, photo*
|
1.  [ViewBug (https://www.viewbug.com)](https://www.viewbug.com)*: top 100K, photo*
|
||||||
@@ -1042,7 +1041,7 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [Gigbucks (https://gigbucks.com/)](https://gigbucks.com/)*: top 10M, dz, eg*
|
1.  [Gigbucks (https://gigbucks.com/)](https://gigbucks.com/)*: top 10M, dz, eg*
|
||||||
1.  [Kashalot (https://kashalot.com)](https://kashalot.com)*: top 10M, ua*
|
1.  [Kashalot (https://kashalot.com)](https://kashalot.com)*: top 10M, ua*
|
||||||
1.  [Angara (https://angara.net)](https://angara.net)*: top 10M, ru*
|
1.  [Angara (https://angara.net)](https://angara.net)*: top 10M, ru*
|
||||||
1.  [APClips (https://apclips.com/)](https://apclips.com/)*: top 10M, video*
|
1.  [APClips (https://apclips.com/)](https://apclips.com/)*: top 10M, porn, video*
|
||||||
1.  [Politikforum (http://www.politikforum.ru/)](http://www.politikforum.ru/)*: top 10M, forum, ru*
|
1.  [Politikforum (http://www.politikforum.ru/)](http://www.politikforum.ru/)*: top 10M, forum, ru*
|
||||||
1.  [Mactalk (http://www.mactalk.com.au/)](http://www.mactalk.com.au/)*: top 10M, au, pk*, search is disabled
|
1.  [Mactalk (http://www.mactalk.com.au/)](http://www.mactalk.com.au/)*: top 10M, au, pk*, search is disabled
|
||||||
1.  [yamaya.ru (https://yamaya.ru)](https://yamaya.ru)*: top 10M, ru*
|
1.  [yamaya.ru (https://yamaya.ru)](https://yamaya.ru)*: top 10M, ru*
|
||||||
@@ -1491,9 +1490,10 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [forum.audacityteam.org (https://forum.audacityteam.org)](https://forum.audacityteam.org)*: top 100M, forum*
|
1.  [forum.audacityteam.org (https://forum.audacityteam.org)](https://forum.audacityteam.org)*: top 100M, forum*
|
||||||
1.  [{username}.ddns.net ({username}.ddns.net)]({username}.ddns.net)*: top 100M*
|
1.  [{username}.ddns.net ({username}.ddns.net)]({username}.ddns.net)*: top 100M*
|
||||||
1.  [Rust-lang (https://users.rust-lang.org)](https://users.rust-lang.org)*: top 100M, coding, forum*
|
1.  [Rust-lang (https://users.rust-lang.org)](https://users.rust-lang.org)*: top 100M, coding, forum*
|
||||||
|
1.  [Taplink (https://taplink.cc/)](https://taplink.cc/)*: top 100M, links*
|
||||||
1.  [MetaDiscourse (https://meta.discourse.org/)](https://meta.discourse.org/)*: top 100M, forum*
|
1.  [MetaDiscourse (https://meta.discourse.org/)](https://meta.discourse.org/)*: top 100M, forum*
|
||||||
1.  [community.icons8.com (https://community.icons8.com)](https://community.icons8.com)*: top 100M, forum*
|
1.  [community.icons8.com (https://community.icons8.com)](https://community.icons8.com)*: top 100M, forum*
|
||||||
1.  [gentoo (https://forums.gentoo.org)](https://forums.gentoo.org)*: top 100M, fi, forum*
|
1.  [gentoo (https://forums.gentoo.org)](https://forums.gentoo.org)*: top 100M, coding, forum*
|
||||||
1.  [forum.inaturalist.org (https://forum.inaturalist.org)](https://forum.inaturalist.org)*: top 100M, forum*
|
1.  [forum.inaturalist.org (https://forum.inaturalist.org)](https://forum.inaturalist.org)*: top 100M, forum*
|
||||||
1.  [Pluralsight (https://app.pluralsight.com)](https://app.pluralsight.com)*: top 100M*
|
1.  [Pluralsight (https://app.pluralsight.com)](https://app.pluralsight.com)*: top 100M*
|
||||||
1.  [F-droid (https://forum.f-droid.org)](https://forum.f-droid.org)*: top 100M, forum*
|
1.  [F-droid (https://forum.f-droid.org)](https://forum.f-droid.org)*: top 100M, forum*
|
||||||
@@ -2523,7 +2523,7 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [ozcardtrader.com.au (http://www.ozcardtrader.com.au/community/)](http://www.ozcardtrader.com.au/community/)*: top 100M, au, forum, sport*
|
1.  [ozcardtrader.com.au (http://www.ozcardtrader.com.au/community/)](http://www.ozcardtrader.com.au/community/)*: top 100M, au, forum, sport*
|
||||||
1.  [p8ntballer-forums.com (http://p8ntballer-forums.com/)](http://p8ntballer-forums.com/)*: top 100M, forum*
|
1.  [p8ntballer-forums.com (http://p8ntballer-forums.com/)](http://p8ntballer-forums.com/)*: top 100M, forum*
|
||||||
1.  [panzer35.ru (http://panzer35.ru)](http://panzer35.ru)*: top 100M, ru*
|
1.  [panzer35.ru (http://panzer35.ru)](http://panzer35.ru)*: top 100M, ru*
|
||||||
1.  [playtime (https://forum.playtime-forum.info)](https://forum.playtime-forum.info)*: top 100M, de, forum*
|
1.  [playtime (https://forum.playtime-forum.info)](https://forum.playtime-forum.info)*: top 100M, de, forum, gaming*, search is disabled
|
||||||
1.  [privateinvestor2000.com (http://privateinvestor2000.com)](http://privateinvestor2000.com)*: top 100M*
|
1.  [privateinvestor2000.com (http://privateinvestor2000.com)](http://privateinvestor2000.com)*: top 100M*
|
||||||
1.  [prizyvnikmoy.ru (http://prizyvnikmoy.ru)](http://prizyvnikmoy.ru)*: top 100M, ru*
|
1.  [prizyvnikmoy.ru (http://prizyvnikmoy.ru)](http://prizyvnikmoy.ru)*: top 100M, ru*
|
||||||
1.  [pvpru (https://pvpru.com/)](https://pvpru.com/)*: top 100M, gaming, ru*, search is disabled
|
1.  [pvpru (https://pvpru.com/)](https://pvpru.com/)*: top 100M, gaming, ru*, search is disabled
|
||||||
@@ -3007,7 +3007,7 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [nookipedia.com ()]()*: top 100M*
|
1.  [nookipedia.com ()]()*: top 100M*
|
||||||
1.  [oldschool.runescape.wiki ()]()*: top 100M*
|
1.  [oldschool.runescape.wiki ()]()*: top 100M*
|
||||||
1.  [openhub.net ()]()*: top 100M*
|
1.  [openhub.net ()]()*: top 100M*
|
||||||
1.  [openriskmanual.org ()]()*: top 100M*
|
1.  [openriskmanual.org ()]()*: top 100M, finance, wiki*, search is disabled
|
||||||
1.  [openwetware.org ()]()*: top 100M*
|
1.  [openwetware.org ()]()*: top 100M*
|
||||||
1.  [oyoy.com ()]()*: top 100M*
|
1.  [oyoy.com ()]()*: top 100M*
|
||||||
1.  [padlet.com ()]()*: top 100M*
|
1.  [padlet.com ()]()*: top 100M*
|
||||||
@@ -3023,7 +3023,7 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [qiita.com ()]()*: top 100M*
|
1.  [qiita.com ()]()*: top 100M*
|
||||||
1.  [rationalwiki.org ()]()*: top 100M*
|
1.  [rationalwiki.org ()]()*: top 100M*
|
||||||
1.  [raymanpc.com ()]()*: top 100M*
|
1.  [raymanpc.com ()]()*: top 100M*
|
||||||
1.  [reactos.org ()]()*: top 100M*
|
1.  [reactos.org ()]()*: top 100M, coding, wiki*, search is disabled
|
||||||
1.  [realcty.org ()]()*: top 100M*
|
1.  [realcty.org ()]()*: top 100M*
|
||||||
1.  [renderosity.com ()]()*: top 100M*
|
1.  [renderosity.com ()]()*: top 100M*
|
||||||
1.  [run-log.com ()]()*: top 100M*
|
1.  [run-log.com ()]()*: top 100M*
|
||||||
@@ -3142,7 +3142,7 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [Codolio (https://codolio.com/)](https://codolio.com/)*: top 100M*, search is disabled
|
1.  [Codolio (https://codolio.com/)](https://codolio.com/)*: top 100M*, search is disabled
|
||||||
1.  [Coinvote (https://coinvote.cc/)](https://coinvote.cc/)*: top 100M*
|
1.  [Coinvote (https://coinvote.cc/)](https://coinvote.cc/)*: top 100M*
|
||||||
1.  [Cracked Forum (https://cracked.sh/)](https://cracked.sh/)*: top 100M, forum*
|
1.  [Cracked Forum (https://cracked.sh/)](https://cracked.sh/)*: top 100M, forum*
|
||||||
1.  [Discord.bio (https://discord.bio/)](https://discord.bio/)*: top 100M*
|
1.  [Discord.bio (https://discord.bio/)](https://discord.bio/)*: top 100M, gaming, social*
|
||||||
1.  [Hacker Sploit (https://forum.hackersploit.org/)](https://forum.hackersploit.org/)*: top 100M, coding, forum*
|
1.  [Hacker Sploit (https://forum.hackersploit.org/)](https://forum.hackersploit.org/)*: top 100M, coding, forum*
|
||||||
1.  [Holopin (https://holopin.io)](https://holopin.io)*: top 100M*
|
1.  [Holopin (https://holopin.io)](https://holopin.io)*: top 100M*
|
||||||
1.  [Patched (https://patched.sh/)](https://patched.sh/)*: top 100M*
|
1.  [Patched (https://patched.sh/)](https://patched.sh/)*: top 100M*
|
||||||
@@ -3161,16 +3161,16 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
1.  [Tonometerbot (https://tonometerbot.com)](https://tonometerbot.com)*: top 100M, crypto*
|
1.  [Tonometerbot (https://tonometerbot.com)](https://tonometerbot.com)*: top 100M, crypto*
|
||||||
1.  [Spatial (https://www.spatial.io)](https://www.spatial.io)*: top 100M, crypto, gaming*
|
1.  [Spatial (https://www.spatial.io)](https://www.spatial.io)*: top 100M, crypto, gaming*
|
||||||
|
|
||||||
The list was updated at (2026-04-03)
|
The list was updated at (2026-04-04)
|
||||||
## Statistics
|
## Statistics
|
||||||
|
|
||||||
Enabled/total sites: 2550/3157 = 80.77%
|
Enabled/total sites: 2546/3157 = 80.65%
|
||||||
|
|
||||||
Incomplete message checks: 341/2550 = 13.37% (false positive risks)
|
Incomplete message checks: 341/2546 = 13.39% (false positive risks)
|
||||||
|
|
||||||
Status code checks: 639/2550 = 25.06% (false positive risks)
|
Status code checks: 636/2546 = 24.98% (false positive risks)
|
||||||
|
|
||||||
False positive risk (total): 38.43%
|
False positive risk (total): 38.37%
|
||||||
|
|
||||||
Sites with probing: 500px, Armchairgm, BinarySearch (disabled), BleachFandom, Bluesky, BongaCams, Boosty, BuyMeACoffee, Calendly, Cent, Chess, Code Sandbox, Code Snippet Wiki, DailyMotion, Discord, Diskusjon.no, Disqus, Docker Hub, Duolingo, FandomCommunityCentral, GitHub, GitLab, Google Plus (archived), Gravatar, Hashnode, Holopin, Imgur, Issuu, Keybase, Kick, Kvinneguiden, LeetCode, Lesswrong, Livejasmin, LocalCryptos (disabled), MicrosoftLearn, MixCloud, Monkeytype, Niftygateway, Omg.lol, Paragraph, Picsart, Plurk, Polarsteps, Rarible, Reddit, Reddit Search (Pushshift) (disabled), RoyalCams, Scratch, Soop, SportsTracker, Spotify (disabled), StackOverflow, Substack, TAP'D, Topcoder, Trello, Twitch, Twitter, Twitter Shadowban (disabled), UnstoppableDomains, Vimeo, Warframe Market, Warpcast, Weibo, Yapisal (disabled), YouNow, en.brickimedia.org, nightbot, notabug.org, qiwi.me (disabled)
|
Sites with probing: 500px, Armchairgm, BinarySearch (disabled), BleachFandom, Bluesky, BongaCams, Boosty, BuyMeACoffee, Calendly, Cent, Chess, Code Sandbox, Code Snippet Wiki, DailyMotion, Discord, Diskusjon.no, Disqus, Docker Hub, Duolingo, FandomCommunityCentral, GitHub, GitLab, Google Plus (archived), Gravatar, Hashnode, Holopin, Imgur, Issuu, Keybase, Kick, Kvinneguiden, LeetCode, Lesswrong, Livejasmin, LocalCryptos (disabled), MicrosoftLearn, MixCloud, Monkeytype, Niftygateway, Omg.lol, Paragraph, Picsart, Plurk, Polarsteps, Rarible, Reddit, Reddit Search (Pushshift) (disabled), RoyalCams, Scratch, Soop, SportsTracker, Spotify (disabled), StackOverflow, Substack, TAP'D, Topcoder, Trello, Twitch, Twitter, Twitter Shadowban (disabled), UnstoppableDomains, Vimeo, Warframe Market, Warpcast, Weibo, Yapisal (disabled), YouNow, en.brickimedia.org, nightbot, notabug.org, qiwi.me (disabled)
|
||||||
|
|
||||||
@@ -3200,13 +3200,13 @@ Top 20 profile URLs:
|
|||||||
|
|
||||||
|
|
||||||
Top 20 tags:
|
Top 20 tags:
|
||||||
- (1066) `NO_TAGS` (non-standard)
|
- (1063) `NO_TAGS` (non-standard)
|
||||||
- (754) `forum`
|
- (754) `forum`
|
||||||
- (125) `gaming`
|
- (127) `gaming`
|
||||||
- (77) `coding`
|
- (79) `coding`
|
||||||
- (59) `photo`
|
- (59) `photo`
|
||||||
|
- (46) `social`
|
||||||
- (46) `tech`
|
- (46) `tech`
|
||||||
- (45) `social`
|
|
||||||
- (41) `news`
|
- (41) `news`
|
||||||
- (39) `blog`
|
- (39) `blog`
|
||||||
- (34) `music`
|
- (34) `music`
|
||||||
@@ -3215,7 +3215,7 @@ Top 20 tags:
|
|||||||
- (25) `crypto`
|
- (25) `crypto`
|
||||||
- (23) `video`
|
- (23) `video`
|
||||||
- (23) `education`
|
- (23) `education`
|
||||||
- (22) `finance`
|
- (23) `finance`
|
||||||
- (21) `art`
|
- (21) `art`
|
||||||
- (21) `freelance`
|
- (21) `freelance`
|
||||||
- (18) `hobby`
|
- (18) `hobby`
|
||||||
|
|||||||
@@ -219,8 +219,21 @@ Rank data fetched from Majestic Million by domains.
|
|||||||
|
|
||||||
# Regenerate db_meta.json to stay in sync with data.json
|
# Regenerate db_meta.json to stay in sync with data.json
|
||||||
try:
|
try:
|
||||||
from generate_db_meta import main as generate_meta
|
import hashlib, json, os
|
||||||
generate_meta()
|
db_data_raw = open(args.base_file, 'rb').read()
|
||||||
|
db_data_parsed = json.loads(db_data_raw)
|
||||||
|
meta = {
|
||||||
|
"version": 1,
|
||||||
|
"updated_at": datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ"),
|
||||||
|
"sites_count": len(db_data_parsed.get("sites", {})),
|
||||||
|
"min_maigret_version": "0.5.0",
|
||||||
|
"data_sha256": hashlib.sha256(db_data_raw).hexdigest(),
|
||||||
|
"data_url": "https://raw.githubusercontent.com/soxoj/maigret/main/maigret/resources/data.json",
|
||||||
|
}
|
||||||
|
meta_path = os.path.join(os.path.dirname(args.base_file), "db_meta.json")
|
||||||
|
with open(meta_path, "w", encoding="utf-8") as mf:
|
||||||
|
json.dump(meta, mf, indent=4, ensure_ascii=False)
|
||||||
|
print(f"Updated {meta_path} ({meta['sites_count']} sites)")
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
print(f"Warning: could not regenerate db_meta.json: {e}")
|
print(f"Warning: could not regenerate db_meta.json: {e}")
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user