from transformers import PretrainedConfig | |
class BitNetConfig(PretrainedConfig):
    """Configuration class registered under the ``"bitnet"`` model type.

    Extends ``PretrainedConfig`` with two extra attributes, ``bit_width``
    and ``group_size``. Any other keyword arguments are forwarded unchanged
    to ``PretrainedConfig.__init__``.

    NOTE(review): the original inline comments were mis-encoded and could
    not be recovered verbatim. Judging by the names, ``bit_width`` is
    presumably the quantization bit width and ``group_size`` the
    quantization group size -- confirm against the modeling code.

    Args:
        bit_width: Stored as ``self.bit_width``. Defaults to ``1.58``.
        group_size: Stored as ``self.group_size``. Defaults to ``64``.
        **kwargs: Passed through to ``PretrainedConfig.__init__``.
    """

    model_type = "bitnet"

    def __init__(
        self,
        bit_width: float = 1.58,
        group_size: int = 64,
        **kwargs,
    ) -> None:
        # Base-class initialisation runs first, exactly as in the original,
        # so the two attributes below are assigned after the kwargs handling.
        super().__init__(**kwargs)
        self.bit_width = bit_width  # presumably the quantization bit width
        self.group_size = group_size  # presumably the quantization group size