fix: Telegram 409 다중 인스턴스 충돌 시 WARNING + 30초 백오프 (#180) #185

Merged
jihoson merged 2 commits from feature/issue-180-telegram-instance-lock into main 2026-02-20 09:52:15 +09:00
2 changed files with 23 additions and 37 deletions
Showing only changes of commit aceba86186 - Show all commits

View File

@@ -516,7 +516,6 @@ class TelegramCommandHandler:
self._last_update_id = 0
self._polling_task: asyncio.Task[None] | None = None
self._running = False
self._conflict_backoff_until: float = 0.0 # epoch time; skip polling until then
def register_command(
self, command: str, handler: Callable[[], Awaitable[None]]
@@ -575,12 +574,6 @@ class TelegramCommandHandler:
async def _poll_loop(self) -> None:
"""Main polling loop that fetches updates."""
while self._running:
# Skip this iteration while a conflict backoff is active
now = asyncio.get_event_loop().time()
if now < self._conflict_backoff_until:
await asyncio.sleep(self._polling_interval)
continue
try:
updates = await self._get_updates()
for update in updates:
@@ -612,15 +605,13 @@ class TelegramCommandHandler:
if resp.status != 200:
error_text = await resp.text()
if resp.status == 409:
# Another bot instance is already polling — back off to reduce conflict.
_conflict_backoff_secs = 30.0
self._conflict_backoff_until = (
asyncio.get_event_loop().time() + _conflict_backoff_secs
)
# Another bot instance is already polling — stop this poller entirely.
# Retrying would keep conflicting with the other instance.
self._running = False
logger.warning(
"Telegram conflict (409): another instance is polling. "
"Backing off %.0fs. Ensure only one bot instance runs at a time.",
_conflict_backoff_secs,
"Telegram conflict (409): another instance is already polling. "
"Disabling Telegram commands for this process. "
"Ensure only one instance of The Ouroboros is running at a time.",
)
else:
logger.error(

View File

@@ -877,10 +877,11 @@ class TestGetUpdates:
assert updates == []
@pytest.mark.asyncio
async def test_get_updates_409_sets_conflict_backoff(self) -> None:
"""409 Conflict response sets conflict_backoff_until and returns empty list."""
async def test_get_updates_409_stops_polling(self) -> None:
"""409 Conflict response stops the poller (_running = False) and returns empty list."""
client = TelegramClient(bot_token="123:abc", chat_id="456", enabled=True)
handler = TelegramCommandHandler(client)
handler._running = True # simulate active poller
mock_resp = AsyncMock()
mock_resp.status = 409
@@ -894,40 +895,34 @@ class TestGetUpdates:
updates = await handler._get_updates()
assert updates == []
assert handler._conflict_backoff_until > 0 # backoff was set
assert handler._running is False # poller stopped
@pytest.mark.asyncio
async def test_poll_loop_skips_during_conflict_backoff(self) -> None:
"""_poll_loop skips _get_updates while conflict backoff is active."""
async def test_poll_loop_exits_after_409(self) -> None:
"""_poll_loop exits naturally after _running is set to False by a 409 response."""
import asyncio as _asyncio
client = TelegramClient(bot_token="123:abc", chat_id="456", enabled=True)
handler = TelegramCommandHandler(client)
# Set an active backoff (far in the future)
handler._conflict_backoff_until = _asyncio.get_event_loop().time() + 600
call_count = 0
get_updates_called = []
async def mock_get_updates() -> list[dict]:
get_updates_called.append(True)
async def mock_get_updates_409() -> list[dict]:
nonlocal call_count
call_count += 1
# Simulate 409 stopping the poller
handler._running = False
return []
handler._get_updates = mock_get_updates # type: ignore[method-assign]
handler._get_updates = mock_get_updates_409 # type: ignore[method-assign]
# Run one iteration of the poll loop then stop
handler._running = True
task = _asyncio.create_task(handler._poll_loop())
await _asyncio.sleep(0.05)
handler._running = False
task.cancel()
try:
await task
except _asyncio.CancelledError:
pass
await _asyncio.wait_for(task, timeout=2.0)
# _get_updates should NOT have been called while backoff is active
assert get_updates_called == []
# _get_updates called exactly once, then loop exited
assert call_count == 1
assert handler._running is False
class TestCommandWithArgs: