# nm-autobot's picture
# Upload folder using huggingface_hub
# b99bb9b verified
# raw
# history blame contribute delete
# 263 Bytes
# Quantization recipe: one stage (`default_stage`) holding one modifier group
# (`default_modifiers`) with a single `GPTQModifier` entry. The nesting below
# is required; with every key at column 0 the three container keys load as
# null and the settings are no longer attached to the modifier.
default_stage:
  default_modifiers:
    GPTQModifier:
      # Module selection. `Linear` looks like a layer class name -- TODO
      # confirm against the consuming tool.
      targets: [Linear]
      # Entries excluded from `targets`. The `re:` prefix presumably marks the
      # entry as a regular expression rather than a literal name -- verify.
      # Kept single-quoted so `[`, `]` and `*` are not read as YAML syntax.
      ignore: [lm_head, 're:.*mlp.gate[.].*']
      # NOTE(review): presumably 8-bit weights / 16-bit activations -- confirm.
      scheme: W8A16
      bypass_divisibility_checks: false
      block_size: 128
      dampening_frac: 0.01
      offload_hessians: false