diff --git a/setup.cfg b/setup.cfg index d6a2913..8bb0000 100644 --- a/setup.cfg +++ b/setup.cfg @@ -36,7 +36,7 @@ install_requires = accelerate>=0.20.3,<0.21.0 huggingface-hub>=0.11.1,<1.0.0 tokenizers>=0.13.3 - transformers>=4.31.0,<4.32.0 + transformers>=4.32.0 speedtest-cli==2.1.3 pydantic>=1.10,<2.0 # 2.0 is incompatible with hivemind yet hivemind==1.1.9 diff --git a/src/petals/server/from_pretrained.py b/src/petals/server/from_pretrained.py index bfbf03e..3468be9 100644 --- a/src/petals/server/from_pretrained.py +++ b/src/petals/server/from_pretrained.py @@ -61,7 +61,7 @@ def load_pretrained_block( ) # dummy load, check that keys match - report = block.load_state_dict(state_dict, strict=True) + report = block.load_state_dict(state_dict, strict=False) assert not report.missing_keys, f"Some block weights are missing: {report.missing_keys}" for param_name, _ in block.named_parameters():