remove slow_but_exact, add quantization

main_fix
justheuristic 2 years ago
parent 43399d7898
commit fde9d50850

@@ -21,12 +21,11 @@ logger = logging.get_logger(__name__)
_CHECKPOINT_FOR_DOC = "bigscience/Bloom" _CHECKPOINT_FOR_DOC = "bigscience/Bloom"
_CONFIG_FOR_DOC = "MemoryEfficientBloomConfig" _CONFIG_FOR_DOC = "MemoryEfficientBloomConfig"
_TOKENIZER_FOR_DOC = "BloomTokenizer" _TOKENIZER_FOR_DOC = "BloomTokenizer"
- _NOT_IMPLEMENTED = 'NOT_IMPLEMENTED'
class MemoryEfficientBloomConfig(_VanillaBloomConfig): class MemoryEfficientBloomConfig(_VanillaBloomConfig):
compression: str = 'none' compression: str = 'none'
- slow_but_exact = _NOT_IMPLEMENTED
+ slow_but_exact: bool = False
class BloomPreTrainedModel(PreTrainedModel): class BloomPreTrainedModel(PreTrainedModel):
@@ -144,7 +143,7 @@ BLOOM_INPUTS_DOCSTRING = r"""
class BloomModel(BloomPreTrainedModel): class BloomModel(BloomPreTrainedModel):
def __init__(self, config): def __init__(self, config):
super().__init__(config) super().__init__(config)
- assert config.slow_but_exact == _NOT_IMPLEMENTED, "slow_but_exact mode was removed for code simplicity"
+ assert not config.slow_but_exact, "slow_but_exact mode was removed for code simplicity"
self.embed_dim = config.hidden_size self.embed_dim = config.hidden_size
self.n_head = config.n_head self.n_head = config.n_head

Loading…
Cancel
Save