Create dummy data when materializing qkv_proj

2024-10-31 09:20:41 +00:00 · 2023-09-03 19:20:07 +03:00 · 2023-09-03 19:20:07 +03:00 · 4159e557bf
commit 4159e557bf
parent 9cb4c721e7
1 changed file with 4 additions and 0 deletions
--- a/src/petals/server/from_pretrained.py
+++ b/src/petals/server/from_pretrained.py
@@ -76,6 +76,10 @@ def load_pretrained_block(
            if not str(param.dtype).startswith(("torch.uint", "torch.int", "torch.bool")):
                param = param.to(torch_dtype)
            set_module_tensor_to_device(block, param_name, "cpu", value=param, dtype=param.dtype)
        else:
            cur_block = getattr(block, param_name)
            dummy_value = torch.empty_like(cur_block, device="cpu")
            set_module_tensor_to_device(block, param_name, "cpu", dummy_value)
    logger.info(f"Loaded {model_name} block {block_index}")
    logger.debug(f"Details: {report}")