check_model_arch()
prepare_model()
QuantAnalyzer
QuantAnalyzer.enable_per_layer_mse_loss()
QuantAnalyzer.analyze()
CallbackFunc
QuantAnalyzer.check_model_sensitivity_to_quantization()
QuantAnalyzer.perform_per_layer_analysis_by_enabling_quant_wrappers()
QuantAnalyzer.perform_per_layer_analysis_by_disabling_quant_wrappers()
QuantAnalyzer.export_per_layer_encoding_min_max_range()
QuantAnalyzer.export_per_layer_stats_histogram()
QuantAnalyzer.export_per_layer_mse_loss()
QuantizationSimModel
QuantizationSimModel.compute_encodings()
QuantizationSimModel.export()
quantsim.save_checkpoint()
quantsim.load_checkpoint()
QuantScheme
QuantScheme.post_training_percentile
QuantScheme.post_training_tf
QuantScheme.post_training_tf_enhanced
QuantScheme.training_range_learning_with_tf_enhanced_init
QuantScheme.training_range_learning_with_tf_init
apply_adaround()
AdaroundParameters
equalize_model()
correct_bias()
ConvBnInfoType
ActivationType
ActivationType.no_activation
ActivationType.relu
ActivationType.relu6
QuantParams
AutoQuant
reestimate_bn_stats()
fold_all_batch_norms_to_scale()
AdapterMetaData
peft.replace_lora_layers_with_quantizable_layers()
peft.track_lora_meta_data()
PeftQuantUtils
PeftQuantUtils.disable_lora_adapters()
PeftQuantUtils.enable_adapter_and_load_weights()
PeftQuantUtils.export_adapter_weights()
PeftQuantUtils.freeze_base_model()
PeftQuantUtils.freeze_base_model_activation_quantizers()
PeftQuantUtils.freeze_base_model_param_quantizers()
PeftQuantUtils.get_fp_lora_layer()
PeftQuantUtils.get_quantized_lora_layer()
PeftQuantUtils.quantize_lora_scale_with_fixed_range()
PeftQuantUtils.set_bitwidth_for_lora_adapters()
BaseQuantizationMixin
BaseQuantizationMixin.input_quantizers
BaseQuantizationMixin.output_quantizers
BaseQuantizationMixin.param_quantizers
BaseQuantizationMixin.__quant_init__()
BaseQuantizationMixin.compute_encodings()
BaseQuantizationMixin.forward()
QuantizerBase
QuantizerBase.allow_overwrite()
QuantizerBase.compute_encodings()
QuantizerBase.get_encoding()
QuantizerBase.get_legacy_encodings()
QuantizerBase.is_initialized()
QuantizerBase.register_quantization_parameter()
QuantizerBase.set_legacy_encodings()
QuantizeDequantize
QuantizeDequantize.forward()
Quantize
Quantize.forward()
EncodingAnalyzer
MinMaxEncodingAnalyzer
SqnrEncodingAnalyzer
PercentileEncodingAnalyzer
FakeQuantizationMixin
FakeQuantizationMixin.input_quantizers
FakeQuantizationMixin.output_quantizers
FakeQuantizationMixin.param_quantizers
FakeQuantizationMixin.forward()
FakeQuantizationMixin.__quant_init__()
FakeQuantizationMixin.compute_encodings()
FakeQuantizationMixin.from_module()
FakeQuantizationMixin.implements()
QuantizationMixin
QuantizationMixin.input_quantizers
QuantizationMixin.output_quantizers
QuantizationMixin.param_quantizers
QuantizationMixin.forward()
QuantizationMixin.__quant_init__()
QuantizationMixin.set_kernel()
QuantizationMixin.set_default_kernel()
QuantizationMixin.compute_encodings()
QuantizationMixin.from_module()
QuantizationMixin.get_default_kernel()
QuantizationMixin.get_kernel()
QuantizationMixin.implements()
quantize()
quantize_dequantize()
dequantize()
FloatQuantizeDequantize
visualize_stats()
ClsSetInfo
fold_all_batch_norms()
scale_model()
bias_fold()
fold_given_batch_norms()
scale_cls_sets()
ModelCompressor
ModelCompressor.compress_model()
GreedySelectionParameters
SpatialSvdParameters
SpatialSvdParameters.AutoModeParams
SpatialSvdParameters.ManualModeParams
SpatialSvdParameters.Mode
SpatialSvdParameters.Mode.auto
SpatialSvdParameters.Mode.manual
WeightSvdParameters
WeightSvdParameters.AutoModeParams
WeightSvdParameters.ManualModeParams
WeightSvdParameters.Mode
WeightSvdParameters.Mode.auto
WeightSvdParameters.Mode.manual
ChannelPruningParameters
ChannelPruningParameters.AutoModeParams
ChannelPruningParameters.ManualModeParams
ChannelPruningParameters.Mode
ChannelPruningParameters.Mode.auto
ChannelPruningParameters.Mode.manual
ModuleCompRatioPair
VisualizeCompression
VisualizeCompression.display_eval_scores()
VisualizeCompression.display_comp_ratio_plot()
visualize_relative_weight_ranges_to_identify_problematic_layers()
visualize_weight_ranges()
visualize_changes_after_optimization()
LayerOutputUtil
LayerOutputUtil.generate_layer_outputs()
NamingScheme
NamingScheme.ONNX
NamingScheme.PYTORCH
NamingScheme.TORCHSCRIPT
CostMetric
CostMetric.mac
CostMetric.memory
CompressionScheme
CompressionScheme.channel_pruning
CompressionScheme.spatial_svd
CompressionScheme.weight_svd