diff --git a/torchao/quantization/quantize_/common/packing_format.py b/torchao/quantization/quantize_/common/packing_format.py index 89acf4eff3..ba969fff00 100644 --- a/torchao/quantization/quantize_/common/packing_format.py +++ b/torchao/quantization/quantize_/common/packing_format.py @@ -37,6 +37,13 @@ class PackingFormat(str, Enum): MARLIN_SPARSE = "marlin_sparse" """ - Unpacked means the subbyte quantized data is stored as int8 + Unpacked to int8 means the subbyte quantized data is stored as int8 """ UNPACKED_TO_INT8 = "unpacked_to_int8" + + """ + Opaque packing format that's used for tensors that do not have a predefined packing format + (that may be decided based on hardware, tensor shape, library availability, etc.) and it's not + needed for the rest of the system to understand the specific format that's adopted. + """ + OPAQUE = "opaque"