Skip to content

Hitless-Upgrade: Add handling of MOVING push notification with "null" host:port info. #3738

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Draft
wants to merge 34 commits into
base: feat/hitless-upgrade-sync-standalone
Choose a base branch
from
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
34 commits
Select commit Hold shift + click to select a range
092e33b
Handling of topology update push notifications for Standalone Redis c…
petyaslavova Jun 27, 2025
41a199e
Adding sequence id to the maintenance push notifications. Adding unit…
petyaslavova Jul 11, 2025
63d0c45
Adding integration-like tests for migrating/migrated events handling
petyaslavova Jul 11, 2025
5c71733
Removed unused imports
petyaslavova Jul 11, 2025
96c6e5d
Revert changing of the default retry object initialization for connec…
petyaslavova Jul 11, 2025
8691475
Complete migrating/migrated integration-like tests
petyaslavova Jul 14, 2025
7b57a22
Adding moving integration-like tests
petyaslavova Jul 15, 2025
bed2e40
Fixed BlockingConnectionPool locking strategy. Removed debug logging.…
petyaslavova Jul 17, 2025
0744ee5
Fixing linters
petyaslavova Jul 17, 2025
4c536f3
Applying Copilot's comments
petyaslavova Jul 17, 2025
6768d5d
Fixed type annotations not compatible with older python versions
petyaslavova Jul 17, 2025
ce31ec7
Add a few more tests and fix pool mock for python 3.9
petyaslavova Jul 17, 2025
d73cd35
Adding maintenance state to connections. Migrating and Migrated are n…
petyaslavova Jul 18, 2025
788cf52
Refactored the tmp host address and timeout storing and the way to ap…
petyaslavova Jul 22, 2025
6d496f0
Apply review comments
petyaslavova Jul 24, 2025
a8ba5ce
Adding handling of FAILING_OVER and FAILED_OVER events/push notificat…
petyaslavova Jul 24, 2025
2d3731f
Applying moving/moved only on connections to the same proxy.
petyaslavova Jul 26, 2025
d2288e9
Adds handshake for enabling server maintenance notifications
elena-kolevska Aug 1, 2025
b294db2
Adds tests
elena-kolevska Aug 7, 2025
a82cbfe
Merge branch 'master' into ps_hitless_upgrade_sync_redis
petyaslavova Aug 8, 2025
2cdfa75
Applying review comments.
petyaslavova Aug 8, 2025
822fccd
Refactor to have less methods in pool classes and made some of the ex…
petyaslavova Aug 11, 2025
2736aaa
Fixing lint errors
petyaslavova Aug 11, 2025
1e2b96d
Fixing tests
petyaslavova Aug 11, 2025
fb487c0
Adds handshake
elena-kolevska Aug 7, 2025
67bbee9
Fixes mock messages to follow the latest standard
elena-kolevska Aug 12, 2025
70688cc
Linters
elena-kolevska Aug 12, 2025
f9eec35
Hitless Upgrades enabled by default
elena-kolevska Aug 12, 2025
5fd2ddb
Fixing unit tests
petyaslavova Aug 13, 2025
e8785de
Applying review comments and moving resolving of conn ip in the Abstr…
petyaslavova Aug 13, 2025
c3caf6a
Fixing the docs of some of the new methods in connection pools. Handl…
petyaslavova Aug 14, 2025
8d7cc00
Merge branch 'ps_hitless_upgrade_sync_redis' into ps_add_fail_over_ev…
petyaslavova Aug 15, 2025
76eba1b
Merge branch 'ps_add_fail_over_events_handling' into hitless_handshake
petyaslavova Aug 15, 2025
e9b49e0
Adding handling for moving notifications with 'null' host/ip info
petyaslavova Aug 15, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
146 changes: 139 additions & 7 deletions redis/_parsers/base.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,17 @@
import logging
import sys
from abc import ABC
from asyncio import IncompleteReadError, StreamReader, TimeoutError
from typing import Callable, List, Optional, Protocol, Union

from redis.maintenance_events import (
NodeFailedOverEvent,
NodeFailingOverEvent,
NodeMigratedEvent,
NodeMigratingEvent,
NodeMovingEvent,
)

if sys.version_info.major >= 3 and sys.version_info.minor >= 11:
from asyncio import timeout as async_timeout
else:
Expand Down Expand Up @@ -50,6 +59,8 @@
"Client sent AUTH, but no password is set": AuthenticationError,
}

logger = logging.getLogger(__name__)


class BaseParser(ABC):
EXCEPTION_CLASSES = {
Expand Down Expand Up @@ -158,48 +169,163 @@ async def read_response(
raise NotImplementedError()


# Push-notification type markers. Each tuple holds the bytes and the str
# spelling of the same marker so a membership test matches the first element
# of a push response in either form.
_INVALIDATION_MESSAGE = (b"invalidate", "invalidate")
_MOVING_MESSAGE = (b"MOVING", "MOVING")
_MIGRATING_MESSAGE = (b"MIGRATING", "MIGRATING")
_MIGRATED_MESSAGE = (b"MIGRATED", "MIGRATED")
_FAILING_OVER_MESSAGE = (b"FAILING_OVER", "FAILING_OVER")
_FAILED_OVER_MESSAGE = (b"FAILED_OVER", "FAILED_OVER")

# Markers routed to the maintenance push handler. MOVING is intentionally not
# part of this group: it is dispatched to its own node-moving handler.
_MAINTENANCE_MESSAGES = (
    *_MIGRATING_MESSAGE,
    *_MIGRATED_MESSAGE,
    *_FAILING_OVER_MESSAGE,
    *_FAILED_OVER_MESSAGE,
)


class PushNotificationsParser(Protocol):
    """Protocol defining RESP3-specific parsing functionality.

    Push responses are dispatched on their first element to one of four
    handlers: pubsub (default), invalidation, node-moving, or maintenance.
    The last three are optional and are skipped while unset.
    """

    pubsub_push_handler_func: Callable
    invalidation_push_handler_func: Optional[Callable] = None
    node_moving_push_handler_func: Optional[Callable] = None
    maintenance_push_handler_func: Optional[Callable] = None

    def handle_pubsub_push_response(self, response):
        """Handle pubsub push responses"""
        raise NotImplementedError()

    @staticmethod
    def _parse_moving_endpoint(endpoint):
        """Split the endpoint field of a MOVING notification into (host, port).

        Accepts the endpoint as ``bytes`` or ``str``. A missing endpoint
        (``None``) or the literal ``"null"`` / ``b"null"`` yields
        ``(None, None)``. The port is returned as a string, exactly as it
        appears in the message.

        Raises:
            ValueError: if the endpoint contains no ``:`` separator.
        """
        if endpoint is None:
            return None, None
        if isinstance(endpoint, bytes):
            endpoint = endpoint.decode()
        if endpoint == "null":
            return None, None
        # Split on the last colon so a host that itself contains colons does
        # not break the two-value unpacking.
        host, port = endpoint.rsplit(":", 1)
        return host, port

    def handle_push_response(self, response, **kwargs):
        """Dispatch a push response to the matching handler.

        Args:
            response: the parsed push message; ``response[0]`` is the
                message type marker (bytes or str).
            **kwargs: accepted for interface compatibility; unused here.

        Returns:
            Whatever the selected handler returns, or ``None`` when no handler
            is registered for the message type or when handling failed.

        Any exception raised while building or delivering an invalidation,
        MOVING or maintenance notification is logged and swallowed. Pubsub
        dispatch happens outside that guard, so its errors propagate.
        """
        msg_type = response[0]
        if msg_type not in (
            *_INVALIDATION_MESSAGE,
            *_MAINTENANCE_MESSAGES,
            *_MOVING_MESSAGE,
        ):
            return self.pubsub_push_handler_func(response)

        try:
            if (
                msg_type in _INVALIDATION_MESSAGE
                and self.invalidation_push_handler_func
            ):
                return self.invalidation_push_handler_func(response)

            if msg_type in _MOVING_MESSAGE and self.node_moving_push_handler_func:
                # Expected message format is: MOVING <seq_number> <time> <endpoint>
                seq_id = response[1]
                ttl = response[2]
                # Referenced through the class so this method also works when
                # borrowed by an object that does not inherit the helper.
                host, port = PushNotificationsParser._parse_moving_endpoint(
                    response[3]
                )
                notification = NodeMovingEvent(seq_id, host, port, ttl)
                return self.node_moving_push_handler_func(notification)

            if msg_type in _MAINTENANCE_MESSAGES and self.maintenance_push_handler_func:
                notification = None

                if msg_type in _MIGRATING_MESSAGE:
                    # Expected message format is: MIGRATING <seq_number> <time> <shard_id-s>
                    seq_id = response[1]
                    ttl = response[2]
                    notification = NodeMigratingEvent(seq_id, ttl)
                elif msg_type in _MIGRATED_MESSAGE:
                    seq_id = response[1]
                    notification = NodeMigratedEvent(seq_id)
                elif msg_type in _FAILING_OVER_MESSAGE:
                    seq_id = response[1]
                    ttl = response[2]
                    notification = NodeFailingOverEvent(seq_id, ttl)
                elif msg_type in _FAILED_OVER_MESSAGE:
                    seq_id = response[1]
                    notification = NodeFailedOverEvent(seq_id)

                if notification is not None:
                    return self.maintenance_push_handler_func(notification)
        except Exception as e:
            logger.error(
                "Error handling {} message ({}): {}".format(msg_type, response, e)
            )

        return None

    def set_pubsub_push_handler(self, pubsub_push_handler_func):
        """Set the pubsub push handler function"""
        self.pubsub_push_handler_func = pubsub_push_handler_func

    def set_invalidation_push_handler(self, invalidation_push_handler_func):
        """Set the invalidation push handler function"""
        self.invalidation_push_handler_func = invalidation_push_handler_func

    def set_node_moving_push_handler(self, node_moving_push_handler_func):
        """Set the node moving push handler function"""
        self.node_moving_push_handler_func = node_moving_push_handler_func

    def set_maintenance_push_handler(self, maintenance_push_handler_func):
        """Set the maintenance push handler function"""
        self.maintenance_push_handler_func = maintenance_push_handler_func


class AsyncPushNotificationsParser(Protocol):
"""Protocol defining async RESP3-specific parsing functionality"""

pubsub_push_handler_func: Callable
invalidation_push_handler_func: Optional[Callable] = None
node_moving_push_handler_func: Optional[Callable] = None
maintenance_push_handler_func: Optional[Callable] = None

async def handle_pubsub_push_response(self, response):
    """Handle pubsub push responses asynchronously

    This definition only raises NotImplementedError.
    NOTE(review): presumably concrete parsers override it - confirm.
    """
    raise NotImplementedError()

async def handle_push_response(self, response, **kwargs):
    """Handle push responses asynchronously.

    Dispatches on ``response[0]`` (bytes or str message type marker) to the
    pubsub, invalidation, node-moving or maintenance handler and awaits it.

    Returns whatever the selected handler returns, or ``None`` when no
    handler is registered for the message type or when handling failed.
    Exceptions raised while building or delivering an invalidation, MOVING
    or maintenance notification are logged and swallowed; pubsub dispatch
    happens outside that guard, so its errors propagate.
    """
    msg_type = response[0]
    if msg_type not in (
        *_INVALIDATION_MESSAGE,
        *_MAINTENANCE_MESSAGES,
        *_MOVING_MESSAGE,
    ):
        return await self.pubsub_push_handler_func(response)

    try:
        if (
            msg_type in _INVALIDATION_MESSAGE
            and self.invalidation_push_handler_func
        ):
            return await self.invalidation_push_handler_func(response)

        if msg_type in _MOVING_MESSAGE and self.node_moving_push_handler_func:
            # push notification from enterprise cluster for node moving
            # Expected message format is: MOVING <seq_number> <time> <endpoint>
            seq_id = response[1]
            ttl = response[2]
            endpoint = response[3]
            # The endpoint may arrive undecoded; normalise to str before
            # comparing against "null" or splitting.
            if isinstance(endpoint, bytes):
                endpoint = endpoint.decode()
            if endpoint is None or endpoint == "null":
                host, port = None, None
            else:
                # Split on the last colon so a host that itself contains
                # colons does not break the two-value unpacking.
                host, port = endpoint.rsplit(":", 1)
            notification = NodeMovingEvent(seq_id, host, port, ttl)
            return await self.node_moving_push_handler_func(notification)

        if msg_type in _MAINTENANCE_MESSAGES and self.maintenance_push_handler_func:
            notification = None

            if msg_type in _MIGRATING_MESSAGE:
                seq_id = response[1]
                ttl = response[2]
                notification = NodeMigratingEvent(seq_id, ttl)
            elif msg_type in _MIGRATED_MESSAGE:
                seq_id = response[1]
                notification = NodeMigratedEvent(seq_id)
            elif msg_type in _FAILING_OVER_MESSAGE:
                seq_id = response[1]
                ttl = response[2]
                notification = NodeFailingOverEvent(seq_id, ttl)
            elif msg_type in _FAILED_OVER_MESSAGE:
                seq_id = response[1]
                notification = NodeFailedOverEvent(seq_id)

            if notification is not None:
                return await self.maintenance_push_handler_func(notification)
    except Exception as e:
        logger.error(
            "Error handling {} message ({}): {}".format(msg_type, response, e)
        )

    return None

def set_pubsub_push_handler(self, pubsub_push_handler_func):
"""Set the pubsub push handler function"""
Expand All @@ -209,6 +335,12 @@ def set_invalidation_push_handler(self, invalidation_push_handler_func):
"""Set the invalidation push handler function"""
self.invalidation_push_handler_func = invalidation_push_handler_func

def set_node_moving_push_handler(self, node_moving_push_handler_func):
    """Set the node moving push handler function"""
    self.node_moving_push_handler_func = node_moving_push_handler_func

def set_maintenance_push_handler(self, maintenance_push_handler_func):
    """Set the maintenance push handler function"""
    self.maintenance_push_handler_func = maintenance_push_handler_func


class _AsyncRESPBase(AsyncBaseParser):
"""Base class for async resp parsing"""
Expand Down
26 changes: 16 additions & 10 deletions redis/_parsers/hiredis.py
Original file line number Diff line number Diff line change
Expand Up @@ -47,6 +47,8 @@ def __init__(self, socket_read_size):
self.socket_read_size = socket_read_size
self._buffer = bytearray(socket_read_size)
self.pubsub_push_handler_func = self.handle_pubsub_push_response
self.node_moving_push_handler_func = None
self.maintenance_push_handler_func = None
self.invalidation_push_handler_func = None
self._hiredis_PushNotificationType = None

Expand Down Expand Up @@ -141,12 +143,15 @@ def read_response(self, disable_decoding=False, push_request=False):
response, self._hiredis_PushNotificationType
):
response = self.handle_push_response(response)
if not push_request:
return self.read_response(
disable_decoding=disable_decoding, push_request=push_request
)
else:

# if this is a push request return the push response
if push_request:
return response

return self.read_response(
disable_decoding=disable_decoding,
push_request=push_request,
)
return response

if disable_decoding:
Expand All @@ -169,12 +174,13 @@ def read_response(self, disable_decoding=False, push_request=False):
response, self._hiredis_PushNotificationType
):
response = self.handle_push_response(response)
if not push_request:
return self.read_response(
disable_decoding=disable_decoding, push_request=push_request
)
else:
if push_request:
return response
return self.read_response(
disable_decoding=disable_decoding,
push_request=push_request,
)

elif (
isinstance(response, list)
and response
Expand Down
16 changes: 11 additions & 5 deletions redis/_parsers/resp3.py
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,8 @@ class _RESP3Parser(_RESPBase, PushNotificationsParser):
def __init__(self, socket_read_size):
super().__init__(socket_read_size)
self.pubsub_push_handler_func = self.handle_pubsub_push_response
self.node_moving_push_handler_func = None
self.maintenance_push_handler_func = None
self.invalidation_push_handler_func = None

def handle_pubsub_push_response(self, response):
Expand Down Expand Up @@ -117,17 +119,21 @@ def _read_response(self, disable_decoding=False, push_request=False):
for _ in range(int(response))
]
response = self.handle_push_response(response)
if not push_request:
return self._read_response(
disable_decoding=disable_decoding, push_request=push_request
)
else:

# if this is a push request return the push response
if push_request:
return response

return self._read_response(
disable_decoding=disable_decoding,
push_request=push_request,
)
else:
raise InvalidResponse(f"Protocol Error: {raw!r}")

if isinstance(response, bytes) and disable_decoding is False:
response = self.encoder.decode(response)

return response


Expand Down
Loading