16 lines
474 B
Python
16 lines
474 B
Python
from ._base import *
|
|
|
|
|
|
class BloomGPTQForCausalLM(BaseGPTQForCausalLM):
    """Bloom module-name configuration for ``BaseGPTQForCausalLM``.

    This subclass defines no methods; it only sets four class-level
    attributes holding Bloom submodule names. How each attribute is
    consumed is decided by the base class, which is not visible here.
    """

    # NOTE(review): presumably the class name of a single repeated
    # transformer block -- confirm against the base class.
    layer_type = "BloomBlock"

    # NOTE(review): presumably the dotted attribute path to the container
    # holding those blocks -- confirm against the base class.
    layers_block_name = "transformer.h"

    # NOTE(review): presumably modules that live outside the repeated
    # blocks (embeddings and final layer norm, judging by the names).
    outside_layer_modules = [
        "transformer.word_embeddings",
        "transformer.word_embeddings_layernorm",
        "transformer.ln_f",
    ]

    # A list of single-element groups, each naming one submodule inside a
    # block. NOTE(review): grouping/order is presumably significant to the
    # base class, so it is kept exactly as declared.
    inside_layer_modules = [
        ["self_attention.query_key_value"],
        ["self_attention.dense"],
        ["mlp.dense_h_to_4h"],
        ["mlp.dense_4h_to_h"],
    ]
|
|
|
|
|
|
# Public API: restricts what `from <this module> import *` exports to the
# Bloom wrapper class only.
__all__ = ["BloomGPTQForCausalLM"]
|