# alexmarques's picture
# Upload folder using huggingface_hub
# c471080 verified
# Quantization recipe: one stage (`quant_stage`) containing a single
# GPTQModifier entry under `quant_modifiers`.
# NOTE(review): nesting was reconstructed from a flattened copy in which every
# key sat at column 0 — confirm against the consuming tool's recipe schema.
quant_stage:
  quant_modifiers:
    GPTQModifier:
      sequential_update: true
      dampening_frac: 0.1
      # Presumably module names excluded from quantization — TODO confirm.
      ignore: [lm_head]
      # Presumably 8-bit weights / 8-bit activations preset — TODO confirm.
      scheme: W8A8
      targets: Linear
      observer: mse