# glm-4v-9b-W4A16-G128 / recipe.yaml
# Uploader: kylesayrs
# Commit message: Upload folder using huggingface_hub
# Commit: 318549b (verified)
# Compression recipe: one stage containing one modifier group, which
# configures a single GPTQModifier. Nesting is significant: the arguments
# below must be children of GPTQModifier, not top-level keys.
DEFAULT_stage:
  DEFAULT_modifiers:
    GPTQModifier:
      sequential_targets: [GLMBlock]
      # NOTE(review): 1e10 is many orders of magnitude above the library's
      # documented default (0.01) — confirm this value is intentional.
      dampening_frac: 10000000000.0
      # NOTE(review): the repository name says W4A16-G128, but the scheme
      # configured here is W8A8 — confirm which one is intended.
      scheme: W8A8
      targets: Linear
      # Entries prefixed with 're:' are presumably regex patterns matched
      # against module names; verify against the modifier's documentation.
      ignore: [transformer.output_layer, 're:transformer.vision.*']