Skip to content

Commit

Permalink
clean-up
Browse files (browse the repository at this point in the history)
  • Loading branch information
dsikka committed Oct 11, 2024
1 parent 5c1f9d2 commit 2575cb7
Show file tree
Hide file tree
Showing 3 changed files with 2 additions and 7 deletions.
1 change: 0 additions & 1 deletion src/compressed_tensors/quantization/lifecycle/apply.py
Original file line number Diff line number Diff line change
Expand Up @@ -246,7 +246,6 @@ def apply_quantization_status(model: Module, status: QuantizationStatus):
if current_status < status >= QuantizationStatus.CALIBRATION > current_status:
# only quantize weights up front when our end goal state is calibration,
# weight quantization parameters are already loaded for frozen/compressed
# TODO: to be removed from compressed-tensors
quantize_weights_upfront = status == QuantizationStatus.CALIBRATION
model.apply(
lambda module: set_module_for_calibration(
Expand Down
6 changes: 1 addition & 5 deletions src/compressed_tensors/quantization/lifecycle/frozen.py
Original file line number Diff line number Diff line change
Expand Up @@ -45,11 +45,7 @@ def freeze_module_quantization(module: Module):
delattr(module, "input_observer")
if hasattr(module, "weight_observer") and not scheme.weights.dynamic:
delattr(module, "weight_observer")
if (
hasattr(module, "output_observer")
and not is_kv_cache_quant_scheme(scheme)
and not scheme.output_activations.dynamic
):
if hasattr(module, "output_observer") and not scheme.output_activations.dynamic:
delattr(module, "output_observer")

module.quantization_status = QuantizationStatus.FROZEN
2 changes: 1 addition & 1 deletion src/compressed_tensors/quantization/quant_args.py
Original file line number Diff line number Diff line change
Expand Up @@ -120,7 +120,7 @@ def get_observer(self):
# keeps state across samples for dynamic
self.observer = "memoryless"

return self.observer
return Observer.load_from_registry(self.observer, quantization_args=self)

# TODO: to be moved into llm-compressor
def get_kv_cache(self):
Expand Down

0 comments on commit 2575cb7

Please sign in to comment.