from ._base import * | |
class BloomGPTQForCausalLM(BaseGPTQForCausalLM): | |
layer_type = "BloomBlock" | |
layers_block_name = "transformer.h" | |
outside_layer_modules = ["transformer.word_embeddings", "transformer.word_embeddings_layernorm", "transformer.ln_f"] | |
inside_layer_modules = [ | |
["self_attention.query_key_value"], | |
["self_attention.dense"], | |
["mlp.dense_h_to_4h"], | |
["mlp.dense_4h_to_h"] | |
] | |
__all__ = ["BloomGPTQForCausalLM"] | |