mirror of
https://github.com/soxoj/maigret.git
synced 2026-05-07 06:24:35 +00:00
23adc178ea
* Initial plan * Fix crash on -a --self-check by adding exception handling in site_self_check and self_check Wrap the body of site_self_check in try/except to catch unexpected errors and always return a valid changes dict. Also add a safety-net try/except in self_check around awaiting individual site check futures so that a single site failure doesn't crash the entire self-check process. Agent-Logs-Url: https://github.com/soxoj/maigret/sessions/5e27d620-5cbb-43d2-a9f9-ecb53a29904d Co-authored-by: soxoj <31013580+soxoj@users.noreply.github.com> * Restore @pytest.mark.slow on test_maigret_results Agent-Logs-Url: https://github.com/soxoj/maigret/sessions/5e27d620-5cbb-43d2-a9f9-ecb53a29904d Co-authored-by: soxoj <31013580+soxoj@users.noreply.github.com> * Document --self-check error resilience, --auto-disable, and --diagnose in docs/ Update command-line-options.rst with expanded --self-check description and new --auto-disable and --diagnose entries. Add a "Database self-check" section to features.rst explaining error-resilient behaviour and usage examples. Update usage-examples.rst to reference --auto-disable. Agent-Logs-Url: https://github.com/soxoj/maigret/sessions/af1f0f09-9112-4902-8475-e81d235ff3ed Co-authored-by: soxoj <31013580+soxoj@users.noreply.github.com> --------- Co-authored-by: copilot-swe-agent[bot] <198982749+Copilot@users.noreply.github.com> Co-authored-by: soxoj <31013580+soxoj@users.noreply.github.com>
205 lines
6.7 KiB
Python
205 lines
6.7 KiB
Python
"""Maigret main module test functions"""
|
|
|
|
import asyncio
|
|
import copy
|
|
from unittest.mock import patch
|
|
|
|
import pytest
|
|
from mock import Mock
|
|
|
|
from maigret.maigret import self_check, maigret
|
|
from maigret.maigret import (
|
|
extract_ids_from_page,
|
|
extract_ids_from_results,
|
|
)
|
|
from maigret.checking import site_self_check
|
|
from maigret.sites import MaigretSite, MaigretDatabase
|
|
from maigret.result import MaigretCheckResult, MaigretCheckStatus
|
|
from tests.conftest import RESULTS_EXAMPLE
|
|
|
|
|
|
@pytest.mark.slow
|
|
@pytest.mark.asyncio
|
|
async def test_self_check_db(test_db):
|
|
# initalize logger to debug
|
|
logger = Mock()
|
|
|
|
assert test_db.sites_dict['InvalidActive'].disabled is False
|
|
assert test_db.sites_dict['ValidInactive'].disabled is True
|
|
assert test_db.sites_dict['ValidActive'].disabled is False
|
|
assert test_db.sites_dict['InvalidInactive'].disabled is True
|
|
|
|
await self_check(
|
|
test_db, test_db.sites_dict, logger, silent=False, auto_disable=True
|
|
)
|
|
|
|
assert test_db.sites_dict['InvalidActive'].disabled is True
|
|
assert test_db.sites_dict['ValidInactive'].disabled is False
|
|
assert test_db.sites_dict['ValidActive'].disabled is False
|
|
assert test_db.sites_dict['InvalidInactive'].disabled is True
|
|
|
|
|
|
@pytest.mark.slow
|
|
@pytest.mark.asyncio
|
|
async def test_self_check_no_progressbar(test_db):
|
|
"""Verify that no_progressbar=True disables the alive_bar in self_check."""
|
|
logger = Mock()
|
|
|
|
with patch('maigret.checking.alive_bar') as mock_alive_bar:
|
|
mock_bar = Mock()
|
|
mock_alive_bar.return_value.__enter__ = Mock(return_value=mock_bar)
|
|
mock_alive_bar.return_value.__exit__ = Mock(return_value=False)
|
|
|
|
await self_check(
|
|
test_db, test_db.sites_dict, logger, silent=True,
|
|
no_progressbar=True,
|
|
)
|
|
|
|
# First call is the self-check progress bar; subsequent calls are
|
|
# from inner search() invocations.
|
|
self_check_call = mock_alive_bar.call_args_list[0]
|
|
_, kwargs = self_check_call
|
|
assert kwargs.get('title') == 'Self-checking'
|
|
assert kwargs.get('disable') is True
|
|
|
|
|
|
@pytest.mark.slow
|
|
@pytest.mark.asyncio
|
|
async def test_self_check_progressbar_enabled_by_default(test_db):
|
|
"""Verify that alive_bar is enabled by default (no_progressbar=False)."""
|
|
logger = Mock()
|
|
|
|
with patch('maigret.checking.alive_bar') as mock_alive_bar:
|
|
mock_bar = Mock()
|
|
mock_alive_bar.return_value.__enter__ = Mock(return_value=mock_bar)
|
|
mock_alive_bar.return_value.__exit__ = Mock(return_value=False)
|
|
|
|
await self_check(
|
|
test_db, test_db.sites_dict, logger, silent=True,
|
|
)
|
|
|
|
self_check_call = mock_alive_bar.call_args_list[0]
|
|
_, kwargs = self_check_call
|
|
assert kwargs.get('title') == 'Self-checking'
|
|
assert kwargs.get('disable') is False
|
|
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_site_self_check_handles_exception(test_db):
|
|
"""Verify that site_self_check catches unexpected exceptions and returns a valid result."""
|
|
logger = Mock()
|
|
sem = asyncio.Semaphore(1)
|
|
site = test_db.sites_dict['ValidActive']
|
|
|
|
with patch('maigret.checking.maigret', side_effect=RuntimeError("test crash")):
|
|
result = await site_self_check(site, logger, sem, test_db)
|
|
|
|
assert isinstance(result, dict)
|
|
assert "issues" in result
|
|
assert len(result["issues"]) > 0
|
|
assert any("Unexpected error" in issue for issue in result["issues"])
|
|
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_self_check_handles_task_exception(test_db):
|
|
"""Verify that self_check continues when individual site checks raise exceptions."""
|
|
logger = Mock()
|
|
|
|
with patch('maigret.checking.maigret', side_effect=RuntimeError("test crash")):
|
|
result = await self_check(
|
|
test_db, test_db.sites_dict, logger, silent=True,
|
|
no_progressbar=True,
|
|
)
|
|
|
|
assert isinstance(result, dict)
|
|
assert 'results' in result
|
|
assert len(result['results']) == len(test_db.sites_dict)
|
|
for r in result['results']:
|
|
assert 'site_name' in r
|
|
assert 'issues' in r
|
|
|
|
|
|
@pytest.mark.slow
|
|
@pytest.mark.skip(reason="broken, fixme")
|
|
def test_maigret_results(test_db):
|
|
logger = Mock()
|
|
|
|
username = 'Skyeng'
|
|
loop = asyncio.get_event_loop()
|
|
results = loop.run_until_complete(
|
|
maigret(username, site_dict=test_db.sites_dict, logger=logger, timeout=30)
|
|
)
|
|
|
|
assert isinstance(results, dict)
|
|
|
|
reddit_site = results['Reddit']['site']
|
|
assert isinstance(reddit_site, MaigretSite)
|
|
|
|
assert reddit_site.json == {
|
|
'tags': ['news', 'social', 'us'],
|
|
'checkType': 'status_code',
|
|
'presenseStrs': ['totalKarma'],
|
|
'disabled': True,
|
|
'alexaRank': 17,
|
|
'url': 'https://www.reddit.com/user/{username}',
|
|
'urlMain': 'https://www.reddit.com/',
|
|
'usernameClaimed': 'blue',
|
|
'usernameUnclaimed': 'noonewouldeverusethis7',
|
|
}
|
|
|
|
del results['Reddit']['site']
|
|
del results['GooglePlayStore']['site']
|
|
|
|
reddit_status = results['Reddit']['status']
|
|
assert isinstance(reddit_status, MaigretCheckResult)
|
|
assert reddit_status.status == MaigretCheckStatus.ILLEGAL
|
|
|
|
playstore_status = results['GooglePlayStore']['status']
|
|
assert isinstance(playstore_status, MaigretCheckResult)
|
|
assert playstore_status.status == MaigretCheckStatus.CLAIMED
|
|
|
|
del results['Reddit']['status']
|
|
del results['GooglePlayStore']['status']
|
|
|
|
assert results['Reddit'].get('future') is None
|
|
del results['GooglePlayStore']['future']
|
|
del results['GooglePlayStore']['checker']
|
|
|
|
assert results == RESULTS_EXAMPLE
|
|
|
|
|
|
@pytest.mark.slow
|
|
def test_extract_ids_from_url(default_db):
|
|
assert default_db.extract_ids_from_url('https://www.reddit.com/user/test') == {
|
|
'test': 'username'
|
|
}
|
|
assert default_db.extract_ids_from_url('https://vk.com/id123') == {'123': 'vk_id'}
|
|
assert default_db.extract_ids_from_url('https://vk.com/ida123') == {
|
|
'ida123': 'username'
|
|
}
|
|
assert default_db.extract_ids_from_url(
|
|
'https://my.mail.ru/yandex.ru/dipres8904/'
|
|
) == {'dipres8904': 'username'}
|
|
assert default_db.extract_ids_from_url(
|
|
'https://reviews.yandex.ru/user/adbced123'
|
|
) == {'adbced123': 'yandex_public_id'}
|
|
|
|
|
|
@pytest.mark.slow
|
|
def test_extract_ids_from_page(test_db):
|
|
logger = Mock()
|
|
extract_ids_from_page('https://www.reddit.com/user/test', logger) == {
|
|
'test': 'username'
|
|
}
|
|
|
|
|
|
def test_extract_ids_from_results(test_db):
|
|
TEST_EXAMPLE: dict = copy.deepcopy(RESULTS_EXAMPLE)
|
|
TEST_EXAMPLE['Reddit']['ids_usernames'] = {'test1': 'yandex_public_id'}
|
|
TEST_EXAMPLE['Reddit']['ids_links'] = ['https://www.reddit.com/user/test2']
|
|
|
|
extract_ids_from_results(TEST_EXAMPLE, test_db) == {
|
|
'test1': 'yandex_public_id',
|
|
'test2': 'username',
|
|
}
|