Documentation for Dflupdatehandler Module¶

`DFLUpdateHandler` ¶

Bases: UpdateHandler

Distributed Federated Learning (DFL) Update Handler.

This handler manages the reception, storage, and tracking of model updates from federation nodes during asynchronous rounds. It supports partial updates, late arrivals, and maintains update history.

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

class DFLUpdateHandler(UpdateHandler):
    """
    Distributed Federated Learning (DFL) Update Handler.

    This handler manages the reception, storage, and tracking of model updates from federation nodes
    during asynchronous rounds. It supports partial updates, late arrivals, and maintains update history.

    Per-node state is kept in ``_updates_storage`` as a ``(last_update_used, history)`` tuple, where
    ``history`` is a ``deque`` bounded by ``buffersize`` and ``last_update_used`` is the update that was
    most recently handed out by ``get_round_updates`` (``None`` until the first one is consumed).
    """

    def __init__(self, aggregator, addr, buffersize=MAX_UPDATE_BUFFER_SIZE):
        """
        Initialize the update handler with required locks and storage.

        Args:
            aggregator (Aggregator): Aggregator instance for the federation.
            addr (str): Address of the local node.
            buffersize (int): Maximum number of historical updates to keep per node.
        """
        self._addr = addr
        self._aggregator: Aggregator = aggregator
        self._buffersize = buffersize
        # node id -> (last update consumed by get_round_updates, bounded history of received updates)
        self._updates_storage: dict[str, tuple[Update, deque[Update]]] = {}
        self._updates_storage_lock = Locker(name="updates_storage_lock", async_lock=True)
        self._sources_expected = set()
        self._sources_received = set()
        # Held while a "notify when all updates arrived" request is pending.
        self._round_updates_lock = Locker(name="round_updates_lock", async_lock=True)
        self._update_federation_lock = Locker(name="update_federation_lock", async_lock=True)
        self._notification_sent_lock = Locker(name="notification_sent_lock", async_lock=True)
        # True once the aggregator has been notified for the current round.
        self._notification = False
        self._missing_ones = set()
        self._nodes_using_historic = set()

    @property
    def us(self):
        """Returns the internal updates storage dictionary."""
        return self._updates_storage

    @property
    def agg(self):
        """Returns the aggregator instance."""
        return self._aggregator

    async def init(self, config=None):
        """
        Subscribe to update-related events from the event manager.

        Args:
            config: Unused by this handler.
        """
        await EventManager.get_instance().subscribe_node_event(UpdateNeighborEvent, self.notify_federation_update)
        await EventManager.get_instance().subscribe_node_event(UpdateReceivedEvent, self.storage_update)

    async def round_expected_updates(self, federation_nodes: set):
        """
        Define which nodes are expected to send updates in this round and reset internal state.

        Args:
            federation_nodes (set): Set of node IDs expected to participate this round.
        """
        await self._update_federation_lock.acquire_async()
        try:
            await self._updates_storage_lock.acquire_async()
            try:
                self._sources_expected = federation_nodes.copy()
                self._sources_received.clear()

                # Initialize new nodes
                for fn in federation_nodes:
                    if fn not in self.us:
                        self.us[fn] = (None, deque(maxlen=self._buffersize))

                # Clear removed nodes (materialized first: the dict is mutated below)
                removed_nodes = [node for node in self._updates_storage if node not in federation_nodes]
                for rn in removed_nodes:
                    del self._updates_storage[rn]

                # Check already received updates
                await self._check_updates_already_received()
            finally:
                # Always release, otherwise a failure above would block every later storage access.
                await self._updates_storage_lock.release_async()
        finally:
            await self._update_federation_lock.release_async()

        # Drop any notification request left pending from the previous round. The release
        # must be awaited: calling release_async() without await never runs the coroutine.
        if self._round_updates_lock.locked():
            await self._round_updates_lock.release_async()

        self._notification = False

    async def _check_updates_already_received(self):
        """
        Scan storage for updates already received in this round.

        A source counts as received when its history holds an update that differs from the
        last update consumed for it (or when nothing has been consumed yet).
        """
        for se in self._sources_expected:
            (last_updt, node_storage) = self._updates_storage[se]
            if len(node_storage):
                try:
                    if node_storage[-1] and (not last_updt or last_updt != node_storage[-1]):
                        self._sources_received.add(se)
                        logging.info(
                            f"Update already received from source: {se} | ({len(self._sources_received)}/{len(self._sources_expected)}) Updates received"
                        )
                except Exception:
                    # Best effort: a failing comparison is logged and the source is simply not
                    # pre-marked. Exception (not a bare except) so cancellation still propagates.
                    logging.exception(
                        f"ERROR: source expected: {se} | last_update None: {(True if not last_updt else False)}, last update storaged None: {(True if not node_storage[-1] else False)}"
                    )

    async def storage_update(self, updt_received_event: UpdateReceivedEvent):
        """
        Store an incoming update and trigger aggregation if all updates are received.

        Updates from sources that are not expected this round are discarded. An update that
        compares equal to one already in the source's history is discarded as a duplicate.

        Args:
            updt_received_event (UpdateReceivedEvent): Event with model update data.
        """
        time_received = time.time()
        (model, weight, source, round_num, _) = await updt_received_event.get_event_data()
        if source in self._sources_expected:
            updt = Update(model, weight, source, round_num, time_received)
            await self._updates_storage_lock.acquire_async()
            try:
                if updt in self.us[source][1]:
                    logging.info(f"Discard | Alerady received update from source: {source} for round: {round_num}")
                else:
                    last_update_used = self.us[source][0]
                    self.us[source][1].append(updt)
                    self.us[source] = (last_update_used, self.us[source][1])
                    logging.info(
                        f"Storage Update | source={source} | round={round_num} | weight={weight} | federation nodes: {self._sources_expected}"
                    )

                    self._sources_received.add(source)
                    updates_left = self._sources_expected.difference(self._sources_received)
                    logging.info(
                        f"Updates received ({len(self._sources_received)}/{len(self._sources_expected)}) | Missing nodes: {updates_left}"
                    )
                    # Only notify when a notification request is pending (round lock held).
                    if self._round_updates_lock.locked() and not updates_left:
                        all_rec = await self._all_updates_received()
                        if all_rec:
                            await self._notify()
            finally:
                # Release even if storing or notifying raised, so later updates are not blocked.
                await self._updates_storage_lock.release_async()
        else:
            if source not in self._sources_received:
                logging.info(f"Discard update | source: {source} not in expected updates for this Round")

    async def get_round_updates(self):
        """
        Retrieve the most recent valid updates for this round, filling gaps if needed.

        Sources whose newest stored update equals the one already consumed are recorded in
        ``_nodes_using_historic``. Sources marked as received but with no stored history are
        skipped with a warning instead of raising.

        Returns:
            dict: A dictionary mapping node ID to (model, weight) tuples.
        """
        await self._updates_storage_lock.acquire_async()
        try:
            updates_missing = self._sources_expected.difference(self._sources_received)
            if updates_missing:
                self._missing_ones = updates_missing
                logging.info(f"Missing updates from sources: {updates_missing}")
            else:
                self._missing_ones.clear()

            self._nodes_using_historic.clear()
            updates = {}
            for sr in self._sources_received:
                entry = self.us.get(sr)
                if not entry or not entry[1]:
                    # _update_source() resets a node's history to an empty deque, so a source
                    # can be marked as received while having nothing stored.
                    logging.warning(f"No stored update available for source: {sr}, skipping")
                    continue
                last_updt_received, source_historic = entry
                updt = source_historic[-1]  # Get last update received
                if last_updt_received and last_updt_received == updt:
                    logging.info(f"Missing update from source: {sr}, using last update received..")
                    self._nodes_using_historic.add(sr)
                else:
                    self.us[sr] = (updt, source_historic)  # Update storage with new last update used
                updates[sr] = (updt.model, updt.weight)
            return updates
        finally:
            await self._updates_storage_lock.release_async()

    async def notify_federation_update(self, updt_nei_event: UpdateNeighborEvent):
        """
        Handle federation node join/leave events.

        A joining node is only added immediately when no notification request is pending;
        a leaving node is only dropped immediately when its update has not been received yet.

        Args:
            updt_nei_event (UpdateNeighborEvent): Event with neighbor update data.
        """
        source, remove = await updt_nei_event.get_event_data()
        if not remove:
            if self._round_updates_lock.locked():
                logging.info(f"Source: {source} will be count next round")
            else:
                await self._update_source(source, remove)
        else:
            if source not in self._sources_received:  # Not received update from this source yet
                await self._update_source(source, remove=True)
                all_rec = await self._all_updates_received()  # Verify if discarding node aggregation could be done
                if all_rec:
                    await self._notify()
            else:
                logging.info(f"Already received update from: {source}, it will be discarded next round")

    async def _update_source(self, source, remove=False):
        """
        Add or remove a node from the expected sources.

        Adding a node also (re)initializes its storage entry with an empty history.

        Args:
            source (str): Node ID.
            remove (bool): Whether to remove the node from the expected list.
        """
        logging.info(f"🔄 Update | remove: {remove} | source: {source}")
        await self._updates_storage_lock.acquire_async()
        try:
            if remove:
                self._sources_expected.discard(source)
            else:
                self.us[source] = (None, deque(maxlen=self._buffersize))
                self._sources_expected.add(source)
            logging.info(f"federation nodes expected this round: {self._sources_expected}")
        finally:
            await self._updates_storage_lock.release_async()

    async def get_round_missing_nodes(self):
        """
        Return the set of nodes whose updates were not received this round.

        Returns:
            set: Missing node IDs. A copy is returned because the internal set is cleared
            in place by ``get_round_updates``.
        """
        return set(self._missing_ones)

    async def notify_if_all_updates_received(self):
        """
        Set a notification trigger and notify aggregator if all updates are already received.

        The round lock acquired here marks the notification request as pending; it is released
        by ``_all_updates_received`` / ``stop_notifying_updates``.
        """
        logging.info("Set notification when all expected updates received")
        await self._round_updates_lock.acquire_async()
        await self._updates_storage_lock.acquire_async()
        try:
            all_received = await self._all_updates_received()
        finally:
            await self._updates_storage_lock.release_async()
        if all_received:
            await self._notify()

    async def stop_notifying_updates(self):
        """
        Cancel any notification triggers for update reception.
        """
        if self._round_updates_lock.locked():
            logging.info("Stop notification updates")
            await self._round_updates_lock.release_async()

    async def _notify(self):
        """
        Notify the aggregator that all expected updates have been received.

        The ``_notification`` flag ensures the aggregator is notified at most once until the
        flag is reset by ``round_expected_updates``.
        """
        await self._notification_sent_lock.acquire_async()
        try:
            if self._notification:
                return
            self._notification = True
            await self.stop_notifying_updates()
        finally:
            await self._notification_sent_lock.release_async()
        logging.info("🔄 Notifying aggregator to release aggregation")
        await self.agg.notify_all_updates_received()

    async def _all_updates_received(self):
        """
        Check if all expected updates have been received.

        When nothing is missing, a pending notification request (round lock) is released.

        Returns:
            bool: True if no updates are missing.
        """
        updates_left = self._sources_expected.difference(self._sources_received)
        if updates_left:
            return False
        logging.info("All updates have been received this round")
        if await self._round_updates_lock.locked_async():
            await self._round_updates_lock.release_async()
        return True

`agg` `property` ¶

Returns the aggregator instance.

`us` `property` ¶

Returns the internal updates storage dictionary.

`__init__(aggregator, addr, buffersize=MAX_UPDATE_BUFFER_SIZE)` ¶

Initialize the update handler with required locks and storage.

Parameters:

Name	Type	Description	Default
`aggregator`	`Aggregator`	Aggregator instance for the federation.	required
`addr`	`str`	Address of the local node.	required
`buffersize`	`int`	Maximum number of historical updates to keep per node.	`MAX_UPDATE_BUFFER_SIZE`

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

def __init__(self, aggregator, addr, buffersize=MAX_UPDATE_BUFFER_SIZE):
    """
    Set up the handler's collaborators, per-node storage, round bookkeeping and locks.

    Args:
        aggregator (Aggregator): Aggregator instance for the federation.
        addr (str): Address of the local node.
        buffersize (int): Maximum number of historical updates to keep per node.
    """

    def _async_locker(lock_name):
        # Every lock of this handler is an async Locker; only the name differs.
        return Locker(name=lock_name, async_lock=True)

    # Collaborators and configuration.
    self._addr = addr
    self._aggregator: Aggregator = aggregator
    self._buffersize = buffersize

    # node id -> (last update used, history of received updates)
    self._updates_storage: dict[str, tuple[Update, deque[Update]]] = {}
    self._updates_storage_lock = _async_locker("updates_storage_lock")

    # Per-round bookkeeping of who should send and who already did.
    self._sources_expected = set()
    self._sources_received = set()

    self._round_updates_lock = _async_locker("round_updates_lock")
    self._update_federation_lock = _async_locker("update_federation_lock")
    self._notification_sent_lock = _async_locker("notification_sent_lock")

    # Whether the aggregator was already notified, plus the outcome of the last collection.
    self._notification = False
    self._missing_ones = set()
    self._nodes_using_historic = set()

`get_round_missing_nodes()` `async` ¶

Return the set of nodes whose updates were not received this round.

Returns:

Name	Type	Description
`set`		Missing node IDs.

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

async def get_round_missing_nodes(self):
    """
    Return the set of nodes whose updates were not received this round.

    A copy is returned: the internal ``_missing_ones`` set is cleared in place by
    ``get_round_updates``, which would otherwise silently empty a set the caller
    is still holding.

    Returns:
        set: Missing node IDs.
    """
    return set(self._missing_ones)

`get_round_updates()` `async` ¶

Retrieve the most recent valid updates for this round, filling gaps if needed.

Returns:

Name	Type	Description
`dict`		A dictionary mapping node ID to (model, weight) tuples.

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

async def get_round_updates(self):
    """
    Retrieve the most recent valid updates for this round, filling gaps if needed.

    For every source marked as received, the newest stored update is returned. If that
    update equals the one already consumed for the source, the source is recorded in
    ``_nodes_using_historic``; otherwise it becomes the source's new "last update used".
    Sources marked as received but without any stored history are skipped with a warning
    instead of raising while the storage lock is held.

    Returns:
        dict: A dictionary mapping node ID to (model, weight) tuples.
    """
    await self._updates_storage_lock.acquire_async()
    try:
        updates_missing = self._sources_expected.difference(self._sources_received)
        if updates_missing:
            self._missing_ones = updates_missing
            logging.info(f"Missing updates from sources: {updates_missing}")
        else:
            self._missing_ones.clear()

        self._nodes_using_historic.clear()
        updates = {}
        for sr in self._sources_received:
            entry = self.us.get(sr)
            if not entry or not entry[1]:
                # Nothing stored for this source (unknown node or empty history deque).
                logging.warning(f"No stored update available for source: {sr}, skipping")
                continue
            last_updt_received, source_historic = entry
            updt = source_historic[-1]  # Get last update received
            if last_updt_received and last_updt_received == updt:
                logging.info(f"Missing update from source: {sr}, using last update received..")
                self._nodes_using_historic.add(sr)
            else:
                self.us[sr] = (updt, source_historic)  # Update storage with new last update used
            updates[sr] = (updt.model, updt.weight)
        return updates
    finally:
        # Release on every path so an error cannot leave the storage locked.
        await self._updates_storage_lock.release_async()

`init(config=None)` `async` ¶

Subscribe to update-related events from the event manager.

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

async def init(self, config=None):
    """
    Register this handler's callbacks for neighbor-change and update-received events.

    Args:
        config: Not used by this handler.
    """
    subscriptions = (
        (UpdateNeighborEvent, self.notify_federation_update),
        (UpdateReceivedEvent, self.storage_update),
    )
    for event_type, callback in subscriptions:
        await EventManager.get_instance().subscribe_node_event(event_type, callback)

`notify_federation_update(updt_nei_event)` `async` ¶

Handle federation node join/leave events.

Parameters:

Name	Type	Description	Default
`updt_nei_event`	`UpdateNeighborEvent`	Event with neighbor update data.	required

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

async def notify_federation_update(self, updt_nei_event: UpdateNeighborEvent):
    """
    React to a node joining or leaving the federation.

    A leaving node whose update has not arrived yet is dropped from the expected sources
    right away, which may complete the round. A joining node is only added right away
    when the round lock is not held; otherwise it is deferred.

    Args:
        updt_nei_event (UpdateNeighborEvent): Event with neighbor update data.
    """
    source, remove = await updt_nei_event.get_event_data()

    if remove:
        if source in self._sources_received:
            logging.info(f"Already received update from: {source}, it will be discarded next round")
            return
        # Not received update from this source yet
        await self._update_source(source, remove=True)
        # Verify if discarding node aggregation could be done
        if await self._all_updates_received():
            await self._notify()
        return

    if self._round_updates_lock.locked():
        logging.info(f"Source: {source} will be count next round")
        return
    await self._update_source(source, remove)

`notify_if_all_updates_received()` `async` ¶

Set a notification trigger and notify aggregator if all updates are already received.

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

async def notify_if_all_updates_received(self):
    """
    Set a notification trigger and notify aggregator if all updates are already received.

    The round lock is acquired to mark the notification request as pending. The storage
    lock only guards the completeness check and is released on every path, so a failing
    check cannot leave the storage permanently locked.
    """
    logging.info("Set notification when all expected updates received")
    await self._round_updates_lock.acquire_async()
    await self._updates_storage_lock.acquire_async()
    try:
        all_received = await self._all_updates_received()
    finally:
        await self._updates_storage_lock.release_async()
    if all_received:
        await self._notify()

`round_expected_updates(federation_nodes)` `async` ¶

Define which nodes are expected to send updates in this round and reset internal state.

Parameters:

Name	Type	Description	Default
`federation_nodes`	`set`	Set of node IDs expected to participate this round.	required

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

async def round_expected_updates(self, federation_nodes: set):
    """
    Define which nodes are expected to send updates in this round and reset internal state.

    Storage entries are created for new nodes and dropped for nodes no longer in the
    federation; updates that already arrived for the new round are then accounted for.

    Args:
        federation_nodes (set): Set of node IDs expected to participate this round.
    """
    await self._update_federation_lock.acquire_async()
    try:
        await self._updates_storage_lock.acquire_async()
        try:
            self._sources_expected = federation_nodes.copy()
            self._sources_received.clear()

            # Initialize new nodes
            for fn in federation_nodes:
                if fn not in self.us:
                    self.us[fn] = (None, deque(maxlen=self._buffersize))

            # Clear removed nodes (materialized first: the dict is mutated below)
            removed_nodes = [node for node in self._updates_storage if node not in federation_nodes]
            for rn in removed_nodes:
                del self._updates_storage[rn]

            # Check already received updates
            await self._check_updates_already_received()
        finally:
            # Release on every path so a failure cannot leave the storage locked.
            await self._updates_storage_lock.release_async()
    finally:
        await self._update_federation_lock.release_async()

    # Drop any notification request left pending from the previous round. The release
    # must be awaited: calling release_async() without await never runs the coroutine.
    if self._round_updates_lock.locked():
        await self._round_updates_lock.release_async()

    self._notification = False

`stop_notifying_updates()` `async` ¶

Cancel any notification triggers for update reception.

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

async def stop_notifying_updates(self):
    """
    Withdraw a pending "all updates received" notification request, if there is one.

    Does nothing when the round lock is not currently held.
    """
    round_lock = self._round_updates_lock
    if not round_lock.locked():
        return
    logging.info("Stop notification updates")
    await round_lock.release_async()

`storage_update(updt_received_event)` `async` ¶

Store an incoming update and trigger aggregation if all updates are received.

Parameters:

Name	Type	Description	Default
`updt_received_event`	`UpdateReceivedEvent`	Event with model update data.	required

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

async def storage_update(self, updt_received_event: UpdateReceivedEvent):
    """
    Store an incoming update and trigger aggregation if all updates are received.

    Updates from sources that are not expected this round are discarded. An update that
    compares equal to one already in the source's history is discarded as a duplicate.
    The storage lock is released on every path, including when storing or notifying raises.

    Args:
        updt_received_event (UpdateReceivedEvent): Event with model update data.
    """
    time_received = time.time()
    # Named round_num so the builtin round() is not shadowed.
    (model, weight, source, round_num, _) = await updt_received_event.get_event_data()
    if source in self._sources_expected:
        updt = Update(model, weight, source, round_num, time_received)
        await self._updates_storage_lock.acquire_async()
        try:
            if updt in self.us[source][1]:
                logging.info(f"Discard | Alerady received update from source: {source} for round: {round_num}")
            else:
                last_update_used = self.us[source][0]
                self.us[source][1].append(updt)
                self.us[source] = (last_update_used, self.us[source][1])
                logging.info(
                    f"Storage Update | source={source} | round={round_num} | weight={weight} | federation nodes: {self._sources_expected}"
                )

                self._sources_received.add(source)
                updates_left = self._sources_expected.difference(self._sources_received)
                logging.info(
                    f"Updates received ({len(self._sources_received)}/{len(self._sources_expected)}) | Missing nodes: {updates_left}"
                )
                # Only notify when a notification request is pending (round lock held).
                if self._round_updates_lock.locked() and not updates_left:
                    all_rec = await self._all_updates_received()
                    if all_rec:
                        await self._notify()
        finally:
            await self._updates_storage_lock.release_async()
    else:
        if source not in self._sources_received:
            logging.info(f"Discard update | source: {source} not in expected updates for this Round")

`Update` ¶

Represents a model update received from a node in a specific training round.

Attributes:

Name	Type	Description
`model`	`object`	The model object or weights received.
`weight`	`float`	The weight or importance of the update.
`source`	`str`	Identifier of the node that sent the update.
`round`	`int`	Training round this update belongs to.
`time_received`	`float`	Timestamp when the update was received.

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

class Update:
    """
    Represents a model update received from a node in a specific training round.

    Two updates compare equal when they belong to the same round, regardless of model,
    weight, source or reception time. Instances are not hashable.

    Attributes:
        model (object): The model object or weights received.
        weight (float): The weight or importance of the update.
        source (str): Identifier of the node that sent the update.
        round (int): Training round this update belongs to.
        time_received (float): Timestamp when the update was received.
    """

    def __init__(self, model, weight, source, round, time_received):
        self.model = model
        self.weight = weight
        self.source = source
        self.round = round
        self.time_received = time_received

    def __eq__(self, other):
        """
        Checks if two updates belong to the same round.

        Returns ``NotImplemented`` for operands that are not ``Update`` instances, so
        comparing against ``None`` or unrelated objects yields ``False`` instead of
        raising ``AttributeError``.
        """
        if not isinstance(other, Update):
            return NotImplemented
        return self.round == other.round

    # Defining __eq__ already makes the class unhashable; stated explicitly because
    # equality depends on a mutable attribute.
    __hash__ = None

`__eq__(other)` ¶

Checks if two updates belong to the same round.

Source code in nebula/core/aggregation/updatehandlers/dflupdatehandler.py

def __eq__(self, other):
    """
    Checks if two updates belong to the same round.

    Returns ``NotImplemented`` for operands that are not ``Update`` instances, so
    comparing against ``None`` or unrelated objects yields ``False`` instead of
    raising ``AttributeError``.
    """
    if not isinstance(other, Update):
        return NotImplemented
    return self.round == other.round

Documentation for Dflupdatehandler Module¶

DFLUpdateHandler ¶

agg property ¶

us property ¶

__init__(aggregator, addr, buffersize=MAX_UPDATE_BUFFER_SIZE) ¶

get_round_missing_nodes() async ¶

get_round_updates() async ¶

init(config=None) async ¶

notify_federation_update(updt_nei_event) async ¶

notify_if_all_updates_received() async ¶

round_expected_updates(federation_nodes) async ¶

stop_notifying_updates() async ¶

storage_update(updt_received_event) async ¶

Update ¶

__eq__(other) ¶

`DFLUpdateHandler` ¶

`agg` `property` ¶

`us` `property` ¶

`__init__(aggregator, addr, buffersize=MAX_UPDATE_BUFFER_SIZE)` ¶

`get_round_missing_nodes()` `async` ¶

`get_round_updates()` `async` ¶

`init(config=None)` `async` ¶

`notify_federation_update(updt_nei_event)` `async` ¶

`notify_if_all_updates_received()` `async` ¶

`round_expected_updates(federation_nodes)` `async` ¶

`stop_notifying_updates()` `async` ¶

`storage_update(updt_received_event)` `async` ¶

`Update` ¶

`__eq__(other)` ¶