Commit ba8563c 1 parent a76563a commit ba8563c Copy full SHA for ba8563c
File tree 3 files changed +4
-5
lines changed
src/llmcompressor/modifiers/quantization/gptq
3 files changed +4
-5
lines changed Original file line number Diff line number Diff line change 16
16
from llmcompressor .core import State
17
17
from llmcompressor .modifiers import Modifier , ModifierFactory
18
18
from llmcompressor .modifiers .quantization .calibration import freeze_module_quantization
19
- from llmcompressor .modifiers .quantization .gptq .utils . gptq_quantize import (
19
+ from llmcompressor .modifiers .quantization .gptq .gptq_quantize import (
20
20
accumulate_hessian ,
21
21
make_empty_hessian ,
22
22
quantize_weight ,
36
36
37
37
class GPTQModifier (Modifier , HooksMixin ):
38
38
"""
39
- Modifier for applying the one-shot OBCQ algorithm to a model
39
+ Implements the GPTQ algorithm from https://arxiv.org/abs/2210.17323. This modifier
40
+ uses activations to calibrate a Hessian matrix, which is then used to determine
41
+ optimal quantization values and orderings for the model weights.
40
42
41
43
| Sample yaml:
42
44
| test_stage:
File renamed without changes.
Load Diff This file was deleted.
You can’t perform that action at this time.
0 commit comments