diff --git a/setup.cfg b/setup.cfg index c485cd5..ca1f4c7 100644 --- a/setup.cfg +++ b/setup.cfg @@ -32,12 +32,12 @@ packages = find: python_requires = >=3.7 install_requires = torch>=1.12 - bitsandbytes==0.37.1 + bitsandbytes==0.38.0.post2 accelerate==0.15.0 huggingface-hub==0.11.1 transformers>=4.25.1,<5.0.0 speedtest-cli==2.1.3 - hivemind @ git+https://github.com/learning-at-home/hivemind.git + hivemind==1.1.7 tensor_parallel==1.0.23 humanfriendly async-timeout>=4.0.2 diff --git a/src/petals/cli/run_server.py b/src/petals/cli/run_server.py index 57761fd..5e7efb5 100644 --- a/src/petals/cli/run_server.py +++ b/src/petals/cli/run_server.py @@ -47,7 +47,7 @@ def main(): parser.add_argument('--announce_maddrs', nargs='+', required=False, help='Visible multiaddrs the host announces for external connections from other peers') - parser.add_argument('--daemon_startup_timeout', type=float, default=120, + parser.add_argument('--daemon_startup_timeout', type=float, default=60, help='Timeout for the libp2p daemon connecting to initial peers') parser.add_argument('--compression', type=str, default='NONE', required=False, help='Tensor compression communication') diff --git a/src/petals/client/remote_model.py b/src/petals/client/remote_model.py index 937cd9c..dc987e4 100644 --- a/src/petals/client/remote_model.py +++ b/src/petals/client/remote_model.py @@ -32,7 +32,7 @@ class DistributedBloomConfig(BloomConfig): initial_peers: List[str] = PUBLIC_INITIAL_PEERS # a list of initial peers for hivemind DHT dht_prefix: str # a prefix for all dht keys that correspond to this model (usually equal to model name) - daemon_startup_timeout: int = 120 # timeout for the libp2p daemon connecting to initial peers + daemon_startup_timeout: int = 60 # timeout for the libp2p daemon connecting to initial peers dht: Optional[hivemind.DHT] = None # a running DHT instance, e.g. when using the same DHT for multiple models request_timeout: int = 3 * 60 # a number of seconds for waiting result from each node max_retries: Optional[int] = None # max number retries before the client raises an exception (default: inf)