0xGrrr committed on
Commit
c9bf07b
1 Parent(s): 1e1a20a

Update modeling_mpt.py

Browse files

This PR adds Accelerate support for MPT models by declaring `_no_split_modules` on `MPTPreTrainedModel`, as discussed in https://huggingface.co/mosaicml/mpt-7b/discussions/45

Files changed (1) hide show
  1. modeling_mpt.py +1 -0
modeling_mpt.py CHANGED
@@ -23,6 +23,7 @@ Tokenizer = Union[PreTrainedTokenizer, PreTrainedTokenizerFast]
23
  class MPTPreTrainedModel(PreTrainedModel):
24
  config_class = MPTConfig
25
  base_model_prefix = 'model'
 
26
 
27
  class MPTModel(MPTPreTrainedModel):
28
 
 
23
  class MPTPreTrainedModel(PreTrainedModel):
24
  config_class = MPTConfig
25
  base_model_prefix = 'model'
26
+ _no_split_modules=["MPTBlock"]
27
 
28
  class MPTModel(MPTPreTrainedModel):
29