From 19d0e378398698e74ed75fe0debc01f2ca2351bc Mon Sep 17 00:00:00 2001 From: Max Ryabinin Date: Wed, 25 Jan 2023 02:44:47 +0100 Subject: [PATCH] Add a temporary hack for larger models --- src/petals/server/server.py | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/src/petals/server/server.py b/src/petals/server/server.py index 9ab80c9..459ae2f 100644 --- a/src/petals/server/server.py +++ b/src/petals/server/server.py @@ -118,6 +118,15 @@ class Server: use_auth_token=use_auth_token, revision=revision, ) + elif converted_model_name_or_path == "facebook/opt-175b": + bloom_config = BloomConfig.from_pretrained( + "bigscience/bloom-petals" + ) + bloom_config.hidden_size = 12288 + bloom_config.n_layer = 96 + bloom_config.n_head = 96 + bloom_config.vocab_size = 50272 + self.block_config = bloom_config else: def _patch_bloom_config(bloom_config: BloomConfig, opt_config: OPTConfig): bloom_config.hidden_size = opt_config.hidden_size