# bnjmnmarie's picture
# Upload folder using huggingface_hub
# 3b1a22b verified
# raw
# history blame contribute delete
# 489 Bytes
# Recipe with one stage (`default_stage`) whose `default_modifiers` group holds
# two modifiers: SmoothQuantModifier and GPTQModifier.
# NOTE(review): the key layout looks like an llm-compressor quantization
# recipe; nesting was reconstructed from a flattened copy — confirm against
# the consuming tool's schema.
default_stage:
  default_modifiers:
    SmoothQuantModifier:
      smoothing_strength: 0.8
      # Each mapping is a 2-tuple: a list of patterns, then a single pattern.
      # Presumably the `re:` prefix marks the value as a regular expression
      # matched against module names — TODO confirm.
      # NOTE(review): `!!python/tuple` is a Python-specific tag; safe loaders
      # (e.g. `yaml.safe_load`) reject it, so the consumer must use a loader
      # that defines this tag.
      mappings:
        - !!python/tuple
          - ['re:.*self_attn.o_proj$']
          - 're:.*self_attn.v_proj$'
        - !!python/tuple
          - ['re:.*mlp.down_proj$']
          - 're:.*mlp.up_proj$'
      # Explicit empty list: nothing is excluded for this modifier.
      ignore: []
    GPTQModifier:
      targets: [Linear]
      # Separate from SmoothQuantModifier's `ignore`; this one lists `lm_head`.
      ignore: [lm_head]
      # Presumably 8-bit weights and 8-bit activations — TODO confirm.
      scheme: W8A8
      block_size: 128
      dampening_frac: 0.01
      actorder: static
      offload_hessians: false