Update src/petals/server/handler.py

10 months ago · 6910c532e0
parent 6d62057f08
commit 6910c532e0
1 changed file with 1 addition and 1 deletion
--- a/src/petals/server/handler.py
+++ b/src/petals/server/handler.py
@@ -168,7 +168,7 @@ class TransformerConnectionHandler(ConnectionHandler):
                batch_size = request.tensors[0].size[0] if request.tensors else 1

                async with self._allocate_cache(
-                    requested_backends, batch_size, max_length, alloc_timeout
+                    requested_backends, batch_size=batch_size, max_length=max_length, timeout=alloc_timeout
                ) as cache_handles:
                    background_tasks = set()
                    async for output_tensors, can_push in iterate_rpc_inference(