petals/src/petals/server/block_selection.py

from dataclasses import dataclass
from typing import Dict, List, Optional, Tuple

import numpy as np
from hivemind import PeerID, get_logger

from petals.data_structures import RemoteModuleInfo, ServerState

__all__ = ["choose_best_blocks", "should_choose_other_blocks"]

logger = get_logger(__name__)


@dataclass
class Span:
    """A contiguous range of blocks ``[start, end)`` attributed to one server."""

    # Index of the first block in the span (inclusive).
    start: int
    # Index one past the last block in the span (exclusive).
    end: int
    # Throughput value recorded for the server that owns this span.
    throughput: float
    # State recorded for the server that owns this span.
    state: ServerState

    @property
    def length(self) -> int:
        """Number of blocks covered by the span."""
        return self.end - self.start

    def move_to(self, new_start: int) -> None:
        """Shift the span so that it begins at ``new_start``, keeping its length unchanged."""
        num_blocks = self.length  # capture before `start` is overwritten
        self.start = new_start
        self.end = new_start + num_blocks


def compute_spans(module_infos: List[Optional[RemoteModuleInfo]]) -> Tuple[Dict[PeerID, Span], np.ndarray]:
    """
    Collect the span of blocks announced by each non-offline server and the total throughput per block.

    :param module_infos: one entry per block index; ``None`` entries are skipped
    :returns: a tuple ``(spans, throughputs)`` where ``spans`` maps each peer ID to the smallest
      ``[start, end)`` range covering all blocks where that peer was seen, and ``throughputs[i]``
      is the sum of ``server.throughput`` over non-offline servers listed for block ``i``
    """
    spans = {}
    throughputs = np.zeros(len(module_infos))
    for block, module in enumerate(module_infos):
        if module is None:
            continue

        # We sort servers here to ensure that we get exactly the same throughputs for a given set of servers.
        # If the order were not defined, we would get slightly different values due to floating point errors,
        # which may cause excess block replacements.
        for peer_id, server in sorted(module.servers.items()):
            if server.state == ServerState.OFFLINE:
                continue

            span = spans.get(peer_id)
            if span is None:
                spans[peer_id] = Span(start=block, end=block + 1, throughput=server.throughput, state=server.state)
            else:
                # Extend the existing span to cover this block. The upper bound must be compared
                # against the current `end` (not `start`), so the span can never shrink.
                span.start = min(span.start, block)
                span.end = max(span.end, block + 1)

            throughputs[block] += server.throughput

    return spans, throughputs


def _choose_best_start(throughputs: np.ndarray, num_blocks: int) -> int:
    options = ((sorted(throughputs[i : i + num_blocks]), i) for i in range(0, len(throughputs) - num_blocks + 1))
    return min(options)[-1]


def choose_best_blocks(num_blocks: int, module_infos: List[Optional[RemoteModuleInfo]]) -> List[int]:
    """
    Choose ``num_blocks`` consecutive block indices for a server to serve.

    :param num_blocks: how many consecutive blocks to pick
    :param module_infos: one entry per block index, as accepted by ``compute_spans``
    :returns: the chosen block indices in ascending order
    """
    throughputs = compute_spans(module_infos)[1]  # the per-peer spans are not needed here
    first_block = _choose_best_start(throughputs, num_blocks)
    return [first_block + offset for offset in range(num_blocks)]


def should_choose_other_blocks(
    local_peer_id: PeerID, module_infos: List[Optional[RemoteModuleInfo]], balance_quality: float
) -> bool:
    """
    Decide whether the local server should move to a different span of blocks.

    The function simulates the local server moving to its best position, then lets every server
    (in random order) greedily move to its own best position until a full pass moves nobody.
    It then compares the minimum per-block throughput before and after the simulation.

    :param local_peer_id: peer ID of the local server; it must own a span in ``module_infos``
    :param module_infos: one entry per block index, as accepted by ``compute_spans``
    :param balance_quality: threshold for the ratio ``initial_throughput / new_throughput``;
      any value above 1.0 makes the function return True unconditionally
    :returns: True if the ratio is below ``balance_quality - eps``; False if the local server would
      not move, if removing it would leave some block with non-positive throughput, or if the
      simulated minimum throughput is lower than the initial one or below ``eps``
    :raises AssertionError: if ``local_peer_id`` has no span
      (NOTE(review): with ``python -O`` the assert is skipped and the lookup raises KeyError instead)
    """
    if balance_quality > 1.0:
        return True  # Forces rebalancing on each check (may be used for debugging purposes)

    spans, throughputs = compute_spans(module_infos)
    initial_throughput = throughputs.min()
    eps = 1e-3

    assert local_peer_id in spans, "Span served by this server is not present in the DHT"
    local_span = spans[local_peer_id]
    throughputs[local_span.start : local_span.end] -= local_span.throughput * (1 + eps)
    # Without (1 + eps) here, we would sometimes subtract a value slightly less than local_span.throughput
    # due to the floating point error, which would cause excess block replacements.
    # Also, subtracting local_span.throughput * (1 + eps) makes _choose_best_start() prefer
    # the previous server position in case of other things being almost equal.

    if initial_throughput > eps and throughputs.min() <= 0:
        return False  # Switching blocks would make the swarm disjoint

    new_start = _choose_best_start(throughputs, local_span.length)
    if local_span.start == new_start:
        return False  # This server is on its best place already

    # Give back the extra `eps` share at the old position (leaving exactly the plain throughput
    # subtracted there), then move the span and add its throughput at the new position.
    throughputs[local_span.start : local_span.end] += local_span.throughput * eps
    local_span.move_to(new_start)
    throughputs[local_span.start : local_span.end] += local_span.throughput

    # Simulate the other servers reacting: repeat passes over all servers in random order
    # until a complete pass finishes without any span being moved.
    moved = True
    while moved:
        servers = list(spans.keys())
        np.random.shuffle(servers)

        moved = False
        for peer_id in servers:
            span = spans[peer_id]
            # Same remove / choose / restore sequence as for the local span above
            throughputs[span.start : span.end] -= span.throughput * (1 + eps)

            new_start = _choose_best_start(throughputs, span.length)

            throughputs[span.start : span.end] += span.throughput * eps
            if span.start != new_start:
                span.move_to(new_start)
                moved = True
            throughputs[span.start : span.end] += span.throughput

    new_throughput = throughputs.min()
    # Do not move if the simulated swarm is not better than the current one;
    # the `< eps` check also keeps the division below away from a near-zero denominator.
    if new_throughput < initial_throughput or new_throughput < eps:
        return False

    actual_quality = initial_throughput / new_throughput
    logger.info(f"Swarm balance quality: {actual_quality * 100:.1f}%")

    return actual_quality < balance_quality - eps
Rebalance swarm when necessary (#34) 2 years ago			`from dataclasses import dataclass`
			`from typing import Dict, List, Optional, Tuple`

			`import numpy as np`
			`from hivemind import PeerID, get_logger`
Implement block selection on servers (#20) 2 years ago
Make Petals a pip-installable package (attempt 2) (#102) 1. Petals can now be installed using `pip install git+https://github.com/bigscience-workshop/petals` - If you have already cloned the repo, you can run `pip install .` or `pip install .[dev]` 2. Moved `src` => `src/petals` - Replaced `from src.smth import smth` with `from petals.smth import smth` 3. Moved `cli` => `src/petals/cli` - Replaced `python -m cli.run_smth` with `python -m petals.cli.run_smth` (all utilities are now available right after pip installation) 4. Moved the `requirements*.txt` contents to `setup.cfg` (`requirements.txt` for packages is not supported well by modern packaging utils) 5. Increased the package version from `0.2` to `1.0alpha1` 2 years ago			`from petals.data_structures import RemoteModuleInfo, ServerState`
Implement block selection on servers (#20) 2 years ago
Rebalance swarm when necessary (#34) 2 years ago			`__all__ = ["choose_best_blocks", "should_choose_other_blocks"]`

Use get_logger(__name__) instead of get_logger(__file__) (#265) 1 year ago			`logger = get_logger(__name__)`
Rebalance swarm when necessary (#34) 2 years ago

			`@dataclass`
			`class Span:`
			`start: int`
			`end: int`
			`throughput: float`
Add `allowed_servers`, `max_retries` options to the client, improve logs (#235) 1 year ago			`state: ServerState`
Rebalance swarm when necessary (#34) 2 years ago
			`@property`
			`def length(self):`
			`return self.end - self.start`

			`def move_to(self, new_start: int) -> None:`
			`self.start, self.end = new_start, new_start + self.length`

Implement block selection on servers (#20) 2 years ago
Optimize RemoteSequenceManager (#106) - [x] made RemoteSequenceManager into a background thread that pre-fetches information instead of running just in time - [x] moved routing-related stuff to petals.client.routing - [x] extract remote peer routing information to RemoteSequenceInfo - [x] made sure that the code survives continued use (e.g. one hour) - [x] updated every spot where update_ is called manually - [x] modified get_sequence to check that the thread is alive, warn if not - [x] removed max_retries, switched rpc_info to exponential backoff - [x] fixed a bug that causes RemoteSeq* to lose user-defined hyperparameters (e.g. timeout) upon subsequencing (sequential[3:5]) - [x] moved client-side points strategy to client.routing - [x] ensured that RemoteSequenceManager thread created in get_remote_module properly shuts down when the module is destroyed - [x] resolved minor affected todos - [x] modified tests to no longer use PYTHONPATH - [x] worked around protocol error in rpc_info Co-authored-by: Aleksandr Borzunov <borzunov.alexander@gmail.com> Co-authored-by: Artem Chumachenko <artek.chumak@gmail.com> 2 years ago			`def compute_spans(module_infos: List[Optional[RemoteModuleInfo]]) -> Tuple[Dict[PeerID, Span], np.ndarray]:`
Rebalance swarm when necessary (#34) 2 years ago			`spans = {}`
			`throughputs = np.zeros(len(module_infos))`
			`for block, module in enumerate(module_infos):`
Implement block selection on servers (#20) 2 years ago			`if module is None:`
			`continue`

Fix floating point issues in block_selection.py (#89) 2 years ago			`# We sort servers here to ensure that we get exactly the same throughputs for a given set of servers.`
			`# If the order were not defined, we would get slightly different values due to floating point errors,`
			`# which may cause excess block replacements.`
			`for peer_id, server in sorted(module.servers.items()):`
Rebalance swarm when necessary (#34) 2 years ago			`if server.state == ServerState.OFFLINE:`
			`continue`

			`if peer_id in spans:`
			`spans[peer_id].start = min(spans[peer_id].start, block)`
			`spans[peer_id].end = max(spans[peer_id].start, block + 1)`
			`else:`
Add `allowed_servers`, `max_retries` options to the client, improve logs (#235) 1 year ago			`spans[peer_id] = Span(start=block, end=block + 1, throughput=server.throughput, state=server.state)`
Rebalance swarm when necessary (#34) 2 years ago
			`throughputs[block] += server.throughput`

			`return spans, throughputs`


Fix floating point issues in block_selection.py (#89) 2 years ago			`def _choose_best_start(throughputs: np.ndarray, num_blocks: int) -> int:`
			`options = ((sorted(throughputs[i : i + num_blocks]), i) for i in range(0, len(throughputs) - num_blocks + 1))`
Rebalance swarm when necessary (#34) 2 years ago			`return min(options)[-1]`


			`def choose_best_blocks(num_blocks: int, module_infos: List[Optional[RemoteModuleInfo]]) -> List[int]:`
Optimize RemoteSequenceManager (#106) - [x] made RemoteSequenceManager into a background thread that pre-fetches information instead of running just in time - [x] moved routing-related stuff to petals.client.routing - [x] extract remote peer routing information to RemoteSequenceInfo - [x] made sure that the code survives continued use (e.g. one hour) - [x] updated every spot where update_ is called manually - [x] modified get_sequence to check that the thread is alive, warn if not - [x] removed max_retries, switched rpc_info to exponential backoff - [x] fixed a bug that causes RemoteSeq* to lose user-defined hyperparameters (e.g. timeout) upon subsequencing (sequential[3:5]) - [x] moved client-side points strategy to client.routing - [x] ensured that RemoteSequenceManager thread created in get_remote_module properly shuts down when the module is destroyed - [x] resolved minor affected todos - [x] modified tests to no longer use PYTHONPATH - [x] worked around protocol error in rpc_info Co-authored-by: Aleksandr Borzunov <borzunov.alexander@gmail.com> Co-authored-by: Artem Chumachenko <artek.chumak@gmail.com> 2 years ago			`_, throughputs = compute_spans(module_infos)`
Fix floating point issues in block_selection.py (#89) 2 years ago			`start = _choose_best_start(throughputs, num_blocks)`
Rebalance swarm when necessary (#34) 2 years ago			`return list(range(start, start + num_blocks))`


			`def should_choose_other_blocks(`
Enable rebalancing by default (#84) 2 years ago			`local_peer_id: PeerID, module_infos: List[Optional[RemoteModuleInfo]], balance_quality: float`
Rebalance swarm when necessary (#34) 2 years ago			`) -> bool:`
Enable rebalancing by default (#84) 2 years ago			`if balance_quality > 1.0:`
Fix "Too many open files" during rebalancing (#83) Now, the number of open files stays the same after every rebalancing. 2 years ago			`return True # Forces rebalancing on each check (may be used for debugging purposes)`

Optimize RemoteSequenceManager (#106) - [x] made RemoteSequenceManager into a background thread that pre-fetches information instead of running just in time - [x] moved routing-related stuff to petals.client.routing - [x] extract remote peer routing information to RemoteSequenceInfo - [x] made sure that the code survives continued use (e.g. one hour) - [x] updated every spot where update_ is called manually - [x] modified get_sequence to check that the thread is alive, warn if not - [x] removed max_retries, switched rpc_info to exponential backoff - [x] fixed a bug that causes RemoteSeq* to lose user-defined hyperparameters (e.g. timeout) upon subsequencing (sequential[3:5]) - [x] moved client-side points strategy to client.routing - [x] ensured that RemoteSequenceManager thread created in get_remote_module properly shuts down when the module is destroyed - [x] resolved minor affected todos - [x] modified tests to no longer use PYTHONPATH - [x] worked around protocol error in rpc_info Co-authored-by: Aleksandr Borzunov <borzunov.alexander@gmail.com> Co-authored-by: Artem Chumachenko <artek.chumak@gmail.com> 2 years ago			`spans, throughputs = compute_spans(module_infos)`
Rebalance swarm when necessary (#34) 2 years ago			`initial_throughput = throughputs.min()`
Fix floating point issues in block_selection.py (#89) 2 years ago			`eps = 1e-3`
Rebalance swarm when necessary (#34) 2 years ago
			`assert local_peer_id in spans, "Span served by this server is not present in the DHT"`
			`local_span = spans[local_peer_id]`
Fix floating point issues in block_selection.py (#89) 2 years ago			`throughputs[local_span.start : local_span.end] -= local_span.throughput * (1 + eps)`
			`# Without (1 + eps) here, we would sometimes subtract a value slightly less than local_span.throughput`
			`# due to the floating point error, which would cause excess block replacements.`
			`# Also, subtracting local_span.throughput * (1 + eps) makes _choose_best_start() prefer`
			`# the previous server position in case of other things being almost equal.`
Rebalance swarm when necessary (#34) 2 years ago
Don't switch blocks if it makes swarm disjoint (#210) Even if the swarm seems to have at least 2 servers for each block, turning off on one of the servers could break it. That's because once a server is turned off, others may move to a better position, creating a significant downtime on their way. This PR prohibits switching blocks if it would make the swarm disjoint along the way. 1 year ago			`if initial_throughput > eps and throughputs.min() <= 0:`
			`return False # Switching blocks would make the swarm disjoint`

Fix floating point issues in block_selection.py (#89) 2 years ago			`new_start = _choose_best_start(throughputs, local_span.length)`
Rebalance swarm when necessary (#34) 2 years ago			`if local_span.start == new_start:`
			`return False # This server is on its best place already`

Fix floating point issues in block_selection.py (#89) 2 years ago			`throughputs[local_span.start : local_span.end] += local_span.throughput * eps`
			`local_span.move_to(new_start)`
Rebalance swarm when necessary (#34) 2 years ago			`throughputs[local_span.start : local_span.end] += local_span.throughput`

			`moved = True`
			`while moved:`
			`servers = list(spans.keys())`
			`np.random.shuffle(servers)`

			`moved = False`
			`for peer_id in servers:`
			`span = spans[peer_id]`
Fix floating point issues in block_selection.py (#89) 2 years ago			`throughputs[span.start : span.end] -= span.throughput * (1 + eps)`
Rebalance swarm when necessary (#34) 2 years ago
Fix floating point issues in block_selection.py (#89) 2 years ago			`new_start = _choose_best_start(throughputs, span.length)`

			`throughputs[span.start : span.end] += span.throughput * eps`
Rebalance swarm when necessary (#34) 2 years ago			`if span.start != new_start:`
			`span.move_to(new_start)`
			`moved = True`
			`throughputs[span.start : span.end] += span.throughput`

			`new_throughput = throughputs.min()`
Use public swarm by default (#92) This PR makes servers and clients use public swarm's bootstrap peers if no other initial peers are specified. If you'd like a server to start a new swarm, provide the `--new_swarm` CLI argument. 2 years ago			`if new_throughput < initial_throughput or new_throughput < eps:`
			`return False`

Enable rebalancing by default (#84) 2 years ago			`actual_quality = initial_throughput / new_throughput`
			`logger.info(f"Swarm balance quality: {actual_quality * 100:.1f}%")`
Rebalance swarm when necessary (#34) 2 years ago
Enable rebalancing by default (#84) 2 years ago			`return actual_quality < balance_quality - eps`