Intel® Neural Compressor
latest▼
Click the link above to switch versions
Getting Started
Installation
API
Legal Information
Security Policy
Repo
Intel® Neural Compressor
Index
Index
A
|
B
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
K
|
L
|
M
|
N
|
O
|
P
|
Q
|
R
|
S
|
T
|
U
|
V
|
W
|
X
A
AcceleratorRegistry (class in neural_compressor.torch.utils.auto_accelerator)
add_fp8_support() (in module neural_compressor.jax.utils.utility)
apply_inlining() (in module neural_compressor.tensorflow.quantization.utils.utility)
apply_single_pattern_pair() (in module neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter)
Auto_Accelerator (class in neural_compressor.torch.utils.auto_accelerator)
auto_detect_accelerator() (in module neural_compressor.torch.utils.auto_accelerator)
AutoAlpha (class in neural_compressor.torch.algorithms.smooth_quant.utility)
autoround_quantize_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
AutoRoundConfig (class in neural_compressor.torch.quantization.config)
AutoRoundQuantizer (class in neural_compressor.torch.algorithms.autoround.autoround)
autotune() (in module neural_compressor.tensorflow.quantization.autotune)
(in module neural_compressor.torch.quantization.autotune)
awq_quantize_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
AWQConfig (class in neural_compressor.torch.quantization.config)
AWQQuantizer (class in neural_compressor.torch.algorithms.weight_only.awq)
axis (neural_compressor.torch.algorithms.weight_only.hqq.qtensor.QTensorMetaInfo attribute)
B
BaseConfig (class in neural_compressor.common.base_config)
BaseDataLoader (class in neural_compressor.tensorflow.utils.data)
BaseModel (class in neural_compressor.tensorflow.utils.model_wrappers)
BatchSampler (class in neural_compressor.tensorflow.utils.data)
BF16Convert (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.bf16.bf16_convert)
BiasCorrection (class in neural_compressor.tensorflow.quantization.utils.transform_graph.bias_correction)
block_wise_calibration() (in module neural_compressor.torch.utils.block_wise)
build_captured_dataloader() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
bypass_reshape() (in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in)
C
cal_scale() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
Calibration (class in neural_compressor.torch.algorithms.smooth_quant.utility)
call_counter() (in module neural_compressor.common.utils.utility)
can_pack_with_numba() (in module neural_compressor.torch.utils.environ)
CaptureOutputToFile (class in neural_compressor.tensorflow.utils.utility)
causal_lm_make_replace_generate_function() (in module neural_compressor.jax.utils.utility)
cfg_to_qconfig() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.static_quant.utility)
change_config_to_hf_format() (in module neural_compressor.torch.algorithms.weight_only.save_load)
check_backend() (in module neural_compressor.jax.utils.utility)
check_cfg_and_qconfig() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.static_quant.utility)
checkpoint_session() (in module neural_compressor.tensorflow.utils.model_wrappers)
clean_module_weight() (in module neural_compressor.torch.algorithms.layer_wise.utils)
collate_tf_preds() (in module neural_compressor.tensorflow.quantization.utils.utility)
combine_histogram() (in module neural_compressor.tensorflow.utils.utility)
ComposableConfig (class in neural_compressor.common.base_config)
config_list (neural_compressor.common.base_config.ComposableConfig attribute)
(neural_compressor.common.base_tuning.ConfigSet attribute)
ConfigLoader (class in neural_compressor.common.base_tuning)
ConfigRegistry (class in neural_compressor.common.base_config)
ConfigSet (class in neural_compressor.common.base_tuning)
construct_function_from_graph_def() (in module neural_compressor.tensorflow.quantization.utils.utility)
convert() (in module neural_compressor.torch.algorithms.qat.quant_utils)
(in module neural_compressor.torch.quantization.quantize)
convert_model_with_mapping() (in module neural_compressor.torch.algorithms.qat.quant_utils)
ConvertAddToBiasAddOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_add_to_biasadd)
ConvertLayoutOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_layout)
ConvertLeakyReluOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_leakyrelu)
ConvertNanToRandom (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_nan_to_random)
ConvertPlaceholderToConst (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_placeholder_to_const)
CPU_Accelerator (class in neural_compressor.torch.utils.auto_accelerator)
CpuInfo (class in neural_compressor.common.utils.utility)
(class in neural_compressor.tensorflow.utils.utility)
create_quant_spec_from_config() (in module neural_compressor.torch.algorithms.pt2e_quant.utility)
create_xiq_quantizer_from_pt2e_config() (in module neural_compressor.torch.algorithms.pt2e_quant.utility)
CUDA_Accelerator (class in neural_compressor.torch.utils.auto_accelerator)
D
deep_get() (in module neural_compressor.tensorflow.utils.utility)
default_collate() (in module neural_compressor.tensorflow.utils.data)
DequantizeCastOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.bf16.dequantize_cast_optimizer)
detect_device() (in module neural_compressor.torch.utils.utility)
detect_processor_type_based_on_hw() (in module neural_compressor.common.utils.utility)
device_synchronize() (in module neural_compressor.torch.utils.environ)
DilatedContraction (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.dilated_contraction)
disable_random() (in module neural_compressor.tensorflow.utils.utility)
dowload_hf_model() (in module neural_compressor.torch.utils.utility)
DummyDataset (class in neural_compressor.tensorflow.utils.data)
DummyDatasetV2 (class in neural_compressor.tensorflow.utils.data)
dump_elapsed_time() (in module neural_compressor.common.utils.utility)
(in module neural_compressor.tensorflow.utils.utility)
dump_model_op_stats() (in module neural_compressor.torch.algorithms.autoround.autoround)
(in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.static_quant.utility)
(in module neural_compressor.torch.utils.utility)
dynamic_quantize() (in module neural_compressor.jax.algorithms.dynamic)
DynamicQDQLayer (class in neural_compressor.jax.quantization.layers_dynamic)
DynamicQuantConfig (class in neural_compressor.jax.quantization.config)
(class in neural_compressor.torch.quantization.config)
E
ElemFormat (class in neural_compressor.torch.algorithms.mx_quant.utils)
enough_memo_store_scale() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
estimator_session() (in module neural_compressor.tensorflow.utils.model_wrappers)
EvaluationFuncWrapper (class in neural_compressor.common.base_tuning)
Evaluator (class in neural_compressor.common.base_tuning)
ExpandDimsOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.expanddims_optimizer)
export() (in module neural_compressor.torch.export.pt2e_export)
export_hf2compressored_model() (in module neural_compressor.torch.export.export_hf)
export_model_for_pt2e_quant() (in module neural_compressor.torch.export.pt2e_export)
F
FakeAffineTensorQuantFunction (class in neural_compressor.torch.algorithms.weight_only.modules)
fetch_module() (in module neural_compressor.torch.algorithms.weight_only.utility)
(in module neural_compressor.torch.utils.utility)
FetchWeightFromReshapeOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fetch_weight_from_reshape)
filter_fn() (in module neural_compressor.torch.algorithms.weight_only.hqq.quantizer)
finalize_calibration() (in module neural_compressor.torch.quantization.quantize)
find_all_layers() (in module neural_compressor.torch.algorithms.weight_only.gptq)
find_layers() (in module neural_compressor.torch.algorithms.weight_only.gptq)
find_layers_name() (in module neural_compressor.torch.algorithms.weight_only.gptq)
find_matching_blocks() (in module neural_compressor.torch.utils.utility)
fix_ref_type_of_graph_def() (in module neural_compressor.tensorflow.quantization.utils.utility)
fn (neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter.PatternPair attribute)
FoldBatchNormNodesOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fold_batch_norm)
forward_wrapper() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.weight_only.utility)
(in module neural_compressor.torch.utils.utility)
fp8_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
FP8Config (class in neural_compressor.torch.quantization.config)
FreezeFakeQuantOpOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.freeze_fake_quant)
FreezeValueTransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.freeze_value)
frozen_pb_session() (in module neural_compressor.tensorflow.utils.model_wrappers)
FuseBiasAddAndAddOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_biasadd_add)
FuseColumnWiseMulOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_column_wise_mul)
FuseConvRedundantDequantizeTransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_conv_redundant_dequantize)
FuseConvRequantizeTransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_conv_requantize)
FuseConvWithMathOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_conv_with_math)
FuseDecomposedBNOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn)
FuseDecomposedINOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in)
FuseGeluOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_gelu)
FuseLayerNormOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_layer_norm)
FuseMatMulRedundantDequantizeTransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_redundant_dequantize)
FuseMatMulRequantizeDequantizeNewAPITransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_requantize)
FuseMatMulRequantizeDequantizeTransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_requantize)
FuseMatMulRequantizeNewAPITransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_requantize)
FuseMatMulRequantizeTransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_requantize)
FuseNodeStartWithConcatV2 (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_concatv2)
(class in neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_concatv2)
FuseNodeStartWithConv2d (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_conv)
(class in neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_conv)
FuseNodeStartWithDeconv2d (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_deconv)
FuseNodeStartWithFusedBatchNormV3 (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_bn)
(class in neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_bn)
FuseNodeStartWithFusedInstanceNorm (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_in)
FuseNodeStartWithMatmul (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_matmul)
(class in neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_matmul)
FuseNodeStartWithPooling (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_pooling)
(class in neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_pooling)
FusePadWithConv2DOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_pad_with_conv)
FusePadWithFP32Conv2DOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_pad_with_fp32_conv)
FuseTransposeReshapeOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_reshape_transpose)
G
generate_activation_observer() (in module neural_compressor.torch.algorithms.static_quant.utility)
generate_feed_dict() (in module neural_compressor.tensorflow.quantization.utils.utility)
generate_xpu_qconfig() (in module neural_compressor.torch.algorithms.static_quant.utility)
GenerateGraphWithQDQPattern (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.insert_qdq_pattern)
get_absorb_layers() (in module neural_compressor.torch.algorithms.weight_only.utility)
get_accelerator() (in module neural_compressor.torch.utils.environ)
get_all_config_set() (in module neural_compressor.tensorflow.quantization.autotune)
(in module neural_compressor.torch.quantization.autotune)
get_all_config_set_from_config_registry() (in module neural_compressor.common.base_config)
get_all_fp32_data() (in module neural_compressor.tensorflow.utils.utility)
get_all_registered_configs() (in module neural_compressor.jax.quantization.config)
(in module neural_compressor.tensorflow.keras.quantization.config)
(in module neural_compressor.torch.quantization.config)
get_block_names() (in module neural_compressor.torch.utils.utility)
get_block_prefix() (in module neural_compressor.torch.algorithms.weight_only.utility)
(in module neural_compressor.torch.utils.block_wise)
get_children() (in module neural_compressor.torch.algorithms.layer_wise.utils)
get_const_dim_count() (in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in)
get_dataloader() (in module neural_compressor.torch.algorithms.autoround.autoround)
get_default_AutoRound_config() (in module neural_compressor.torch.quantization.config)
get_default_awq_config() (in module neural_compressor.torch.quantization.config)
get_default_double_quant_config() (in module neural_compressor.torch.quantization.config)
get_default_dynamic_config() (in module neural_compressor.jax.quantization.config)
(in module neural_compressor.torch.quantization.config)
get_default_fp8_config() (in module neural_compressor.torch.quantization.config)
get_default_fp8_config_set() (in module neural_compressor.torch.quantization.config)
get_default_gptq_config() (in module neural_compressor.torch.quantization.config)
get_default_hqq_config() (in module neural_compressor.torch.quantization.config)
get_default_mixed_precision_config() (in module neural_compressor.torch.quantization.config)
get_default_mixed_precision_config_set() (in module neural_compressor.torch.quantization.config)
get_default_mx_config() (in module neural_compressor.torch.quantization.config)
get_default_qat_module_mappings() (in module neural_compressor.torch.quantization.config)
get_default_rtn_config() (in module neural_compressor.torch.quantization.config)
get_default_sq_config() (in module neural_compressor.tensorflow.quantization.config)
(in module neural_compressor.torch.quantization.config)
get_default_static_config() (in module neural_compressor.jax.quantization.config)
(in module neural_compressor.torch.quantization.config)
get_default_static_quant_config() (in module neural_compressor.tensorflow.keras.quantization.config)
(in module neural_compressor.tensorflow.quantization.config)
get_default_teq_config() (in module neural_compressor.torch.quantization.config)
get_depth() (in module neural_compressor.torch.algorithms.static_quant.utility)
get_dequantize_fun() (in module neural_compressor.jax.utils.utility)
get_dict_at_depth() (in module neural_compressor.torch.algorithms.static_quant.utility)
get_double_quant_config_dict() (in module neural_compressor.torch.utils.utility)
get_element_under_depth() (in module neural_compressor.torch.algorithms.static_quant.utility)
get_enum_from_format() (in module neural_compressor.torch.utils.utility)
get_filter_fn() (in module neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter)
get_graph_def() (in module neural_compressor.tensorflow.quantization.utils.utility)
get_half_precision_node_set() (in module neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter)
get_input_output_node_names() (in module neural_compressor.tensorflow.quantization.utils.utility)
get_ipex_version() (in module neural_compressor.torch.utils.environ)
get_layer_names_in_block() (in module neural_compressor.torch.utils.utility)
get_mllm_dataloader() (in module neural_compressor.torch.algorithms.autoround.autoround)
get_model_device() (in module neural_compressor.torch.utils.utility)
get_model_info() (in module neural_compressor.torch.utils.utility)
get_model_input_shape() (in module neural_compressor.tensorflow.quantization.utils.utility)
get_model_type() (in module neural_compressor.tensorflow.utils.model_wrappers)
get_module() (in module neural_compressor.torch.algorithms.layer_wise.utils)
(in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.weight_only.utility)
(in module neural_compressor.torch.utils.utility)
get_module_input_output() (in module neural_compressor.torch.algorithms.weight_only.utility)
get_multimodal_block_names() (in module neural_compressor.torch.utils.utility)
get_named_children() (in module neural_compressor.torch.algorithms.layer_wise.utils)
get_non_persistent_buffers() (in module neural_compressor.torch.utils.utility)
get_parent() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.weight_only.utility)
get_processor_type_from_user_config() (in module neural_compressor.torch.utils.utility)
get_q_params() (in module neural_compressor.jax.utils.utility)
get_quant_config() (in module neural_compressor.torch.algorithms.qat.quant_utils)
get_quant_config_with_scheme() (in module neural_compressor.torch.algorithms.qat.quant_utils)
get_quantizable_ops_from_cfgs() (in module neural_compressor.torch.algorithms.static_quant.utility)
get_quantizable_ops_recursively() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.static_quant.utility)
get_quantization_format() (in module neural_compressor.torch.algorithms.qat.quant_utils)
get_quantize_fun() (in module neural_compressor.jax.utils.utility)
get_quantizer() (in module neural_compressor.torch.utils.utility)
get_rtn_double_quant_config_set() (in module neural_compressor.torch.quantization.autotune)
get_scale() (in module neural_compressor.jax.utils.utility)
get_super_module_by_name() (in module neural_compressor.torch.algorithms.layer_wise.utils)
get_tensor_by_name() (in module neural_compressor.tensorflow.quantization.utils.utility)
get_tensor_histogram() (in module neural_compressor.tensorflow.utils.utility)
get_tf_model_type() (in module neural_compressor.tensorflow.utils.model_wrappers)
get_torch_version() (in module neural_compressor.torch.utils.environ)
get_unquantized_node_set() (in module neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter)
get_used_cpu_mem_MB() (in module neural_compressor.torch.utils.environ)
get_used_hpu_mem_MB() (in module neural_compressor.torch.utils.environ)
get_woq_tuning_config() (in module neural_compressor.torch.quantization.config)
get_workspace() (in module neural_compressor.common.utils.utility)
GPTQ (class in neural_compressor.torch.algorithms.weight_only.gptq)
gptq_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
GPTQConfig (class in neural_compressor.torch.quantization.config)
GPTQuantizer (class in neural_compressor.torch.algorithms.weight_only.gptq)
graph_def_session() (in module neural_compressor.tensorflow.utils.model_wrappers)
graph_session() (in module neural_compressor.tensorflow.utils.model_wrappers)
GraphAnalyzer (class in neural_compressor.tensorflow.quantization.utils.graph_util)
GraphConverter (class in neural_compressor.tensorflow.quantization.utils.graph_converter)
GraphCseOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.graph_cse_optimizer)
GraphFoldConstantOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fold_constant)
GraphRewriterBase (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.graph_base)
GraphRewriterHelper (class in neural_compressor.tensorflow.quantization.utils.graph_util)
GraphTrace (class in neural_compressor.torch.algorithms.smooth_quant.utility)
(class in neural_compressor.torch.algorithms.weight_only.utility)
GraphTransformBase (class in neural_compressor.tensorflow.quantization.utils.transform_graph.graph_transform_base)
GrapplerOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.grappler_pass)
group_size (neural_compressor.torch.algorithms.weight_only.hqq.qtensor.QTensorMetaInfo attribute)
H
HalfPrecisionConverter (class in neural_compressor.torch.algorithms.mixed_precision.half_precision_convert)
HalfPrecisionModuleWrapper (class in neural_compressor.torch.algorithms.mixed_precision.module_wrappers)
HPU_Accelerator (class in neural_compressor.torch.utils.auto_accelerator)
HPUWeightOnlyLinear (class in neural_compressor.torch.algorithms.weight_only.modules)
hqq_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
HQQConfig (class in neural_compressor.torch.quantization.config)
HQQLinear (class in neural_compressor.torch.algorithms.weight_only.hqq.core)
HQQModuleConfig (class in neural_compressor.torch.algorithms.weight_only.hqq.config)
HQQTensorHandle (class in neural_compressor.torch.algorithms.weight_only.hqq.core)
HQQuantizer (class in neural_compressor.torch.algorithms.weight_only.hqq.quantizer)
hybrid_gptq_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
HybridGPTQConfig (class in neural_compressor.torch.quantization.config)
I
INCAcceleratorType (class in neural_compressor.torch.utils.auto_accelerator)
INCWeightOnlyLinear (class in neural_compressor.torch.algorithms.weight_only.modules)
IndexFetcher (class in neural_compressor.tensorflow.utils.data)
init_tuning() (in module neural_compressor.common.base_tuning)
initialize_int8_avgpool() (in module neural_compressor.tensorflow.keras.layers.pool2d)
initialize_int8_conv2d() (in module neural_compressor.tensorflow.keras.layers.conv2d)
initialize_int8_dense() (in module neural_compressor.tensorflow.keras.layers.dense)
initialize_int8_depthwise_conv2d() (in module neural_compressor.tensorflow.keras.layers.depthwise_conv2d)
initialize_int8_maxpool() (in module neural_compressor.tensorflow.keras.layers.pool2d)
initialize_int8_separable_conv2d() (in module neural_compressor.tensorflow.keras.layers.separable_conv2d)
InjectDummyBiasAddOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.dummy_biasadd)
InsertLogging (class in neural_compressor.tensorflow.quantization.utils.transform_graph.insert_logging)
InsertPrintMinMaxNode (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.insert_print_node)
INT8StaticQuantConfig (class in neural_compressor.torch.quantization.config)
is_ckpt_format() (in module neural_compressor.tensorflow.quantization.utils.utility)
is_hpex_available() (in module neural_compressor.torch.utils.environ)
is_hpex_support_g_idx() (in module neural_compressor.torch.utils.environ)
is_hpu_available() (in module neural_compressor.torch.utils.environ)
is_ipex_available() (in module neural_compressor.torch.utils.environ)
is_ipex_imported() (in module neural_compressor.torch.utils.environ)
is_leaf() (in module neural_compressor.torch.algorithms.weight_only.gptq)
is_numba_available() (in module neural_compressor.torch.utils.environ)
is_optimum_available() (in module neural_compressor.torch.utils.environ)
is_optimum_habana_available() (in module neural_compressor.torch.utils.environ)
is_package_available() (in module neural_compressor.torch.utils.environ)
is_quantlinear() (in module neural_compressor.torch.algorithms.qat.quant_utils)
is_saved_model_format() (in module neural_compressor.tensorflow.quantization.utils.utility)
is_tbb_available() (in module neural_compressor.torch.utils.environ)
is_transformers_imported() (in module neural_compressor.torch.utils.environ)
IterableFetcher (class in neural_compressor.tensorflow.utils.data)
IterableSampler (class in neural_compressor.tensorflow.utils.data)
iterate_over_layers() (in module neural_compressor.jax.utils.utility)
iterator_sess_run() (in module neural_compressor.tensorflow.quantization.utils.utility)
itex_installed() (in module neural_compressor.tensorflow.utils.utility)
K
keras_session() (in module neural_compressor.tensorflow.utils.model_wrappers)
KerasAdaptor (class in neural_compressor.tensorflow.algorithms.static_quant.keras)
KerasConfigConverter (class in neural_compressor.tensorflow.algorithms.static_quant.keras)
KerasModel (class in neural_compressor.tensorflow.utils.model_wrappers)
KerasQuantizedGemmaWrapper (class in neural_compressor.jax.quantization.saving)
KerasQuantizedModelBackboneWrapper (class in neural_compressor.jax.quantization.saving)
KerasQuantizedModelWrapper (class in neural_compressor.jax.quantization.saving)
KerasQuantizedModelWrapperMixin (class in neural_compressor.jax.quantization.saving)
KerasQuantizedTokenizerWrapper (class in neural_compressor.jax.quantization.saving)
KerasQuantizedViTWrapper (class in neural_compressor.jax.quantization.saving)
KerasQuery (class in neural_compressor.tensorflow.algorithms.static_quant.keras)
KerasSurgery (class in neural_compressor.tensorflow.algorithms.static_quant.keras)
L
LazyImport (class in neural_compressor.common.utils.utility)
load() (in module neural_compressor.torch.algorithms.layer_wise.load)
(in module neural_compressor.torch.algorithms.pt2e_quant.save_load)
(in module neural_compressor.torch.algorithms.static_quant.save_load)
(in module neural_compressor.torch.algorithms.weight_only.save_load)
(in module neural_compressor.torch.quantization.save_load_entry)
load_config_mapping() (in module neural_compressor.common.utils.save_load)
load_empty_model() (in module neural_compressor.torch.utils.utility)
load_first_layer_only() (in module neural_compressor.torch.algorithms.layer_wise.utils)
load_layer_wise_quantized_model() (in module neural_compressor.torch.algorithms.layer_wise.utils)
load_model_from_shards_with_safetensors() (in module neural_compressor.torch.algorithms.layer_wise.utils)
load_module() (in module neural_compressor.torch.algorithms.layer_wise.utils)
load_non_persistent_buffers() (in module neural_compressor.torch.utils.utility)
load_saved_model() (in module neural_compressor.tensorflow.utils.model_wrappers)
load_tensor() (in module neural_compressor.torch.algorithms.layer_wise.utils)
load_tensor_from_safetensors() (in module neural_compressor.torch.algorithms.layer_wise.utils)
load_tensor_from_safetensors_shard() (in module neural_compressor.torch.algorithms.layer_wise.utils)
load_tensor_from_shard() (in module neural_compressor.torch.algorithms.layer_wise.utils)
load_value() (in module neural_compressor.torch.algorithms.layer_wise.utils)
log_process() (in module neural_compressor.common.utils.utility)
log_quantizable_layers_per_transformer() (in module neural_compressor.torch.algorithms.weight_only.gptq)
Logger (class in neural_compressor.common.utils.logger)
M
Matmul (class in neural_compressor.torch.algorithms.weight_only.modules)
MergeDuplicatedQDQOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.merge_duplicated_qdq)
MetaInfoChangingMemOpOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.meta_op_optimizer)
MinMaxObserver (class in neural_compressor.jax.quantization.layers_static)
mixed_precision_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
MixedPrecisionConfig (class in neural_compressor.torch.quantization.config)
Mode (class in neural_compressor.common.utils.constants)
Model (class in neural_compressor.tensorflow.utils.model)
model_forward() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.weight_only.utility)
model_forward_per_sample() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
MODEL_LEVEL (neural_compressor.common.tuning_param.ParamLevel attribute)
module
neural_compressor
neural_compressor.common
neural_compressor.common.base_config
neural_compressor.common.base_tuning
neural_compressor.common.tuning_param
neural_compressor.common.utils
neural_compressor.common.utils.constants
neural_compressor.common.utils.logger
neural_compressor.common.utils.save_load
neural_compressor.common.utils.utility
neural_compressor.common.version
neural_compressor.jax
neural_compressor.jax.algorithms
neural_compressor.jax.algorithms.dynamic
neural_compressor.jax.algorithms.static
neural_compressor.jax.quantization
neural_compressor.jax.quantization.config
neural_compressor.jax.quantization.layers_dynamic
neural_compressor.jax.quantization.layers_static
neural_compressor.jax.quantization.quantize
neural_compressor.jax.quantization.saving
neural_compressor.jax.utils
neural_compressor.jax.utils.utility
neural_compressor.tensorflow
neural_compressor.tensorflow.algorithms
neural_compressor.tensorflow.algorithms.smoother
neural_compressor.tensorflow.algorithms.smoother.calibration
neural_compressor.tensorflow.algorithms.smoother.core
neural_compressor.tensorflow.algorithms.smoother.scaler
neural_compressor.tensorflow.algorithms.static_quant
neural_compressor.tensorflow.algorithms.static_quant.keras
neural_compressor.tensorflow.algorithms.static_quant.tensorflow
neural_compressor.tensorflow.keras
neural_compressor.tensorflow.keras.layers
neural_compressor.tensorflow.keras.layers.conv2d
neural_compressor.tensorflow.keras.layers.dense
neural_compressor.tensorflow.keras.layers.depthwise_conv2d
neural_compressor.tensorflow.keras.layers.layer_initializer
neural_compressor.tensorflow.keras.layers.pool2d
neural_compressor.tensorflow.keras.layers.separable_conv2d
neural_compressor.tensorflow.keras.quantization
neural_compressor.tensorflow.keras.quantization.config
neural_compressor.tensorflow.quantization
neural_compressor.tensorflow.quantization.algorithm_entry
neural_compressor.tensorflow.quantization.autotune
neural_compressor.tensorflow.quantization.config
neural_compressor.tensorflow.quantization.quantize
neural_compressor.tensorflow.quantization.utils
neural_compressor.tensorflow.quantization.utils.graph_converter
neural_compressor.tensorflow.quantization.utils.graph_rewriter
neural_compressor.tensorflow.quantization.utils.graph_rewriter.bf16
neural_compressor.tensorflow.quantization.utils.graph_rewriter.bf16.bf16_convert
neural_compressor.tensorflow.quantization.utils.graph_rewriter.bf16.dequantize_cast_optimizer
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_add_to_biasadd
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_layout
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_leakyrelu
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_nan_to_random
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_placeholder_to_const
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.dilated_contraction
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.dummy_biasadd
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.expanddims_optimizer
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fetch_weight_from_reshape
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fold_batch_norm
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fold_constant
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_biasadd_add
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_column_wise_mul
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_conv_with_math
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_gelu
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_layer_norm
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_pad_with_conv
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_pad_with_fp32_conv
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_reshape_transpose
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.graph_cse_optimizer
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.grappler_pass
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.insert_print_node
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.move_squeeze_after_relu
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.pre_optimize
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.remove_training_nodes
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.rename_batch_norm
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.split_shared_input
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.strip_equivalent_nodes
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.strip_unused_nodes
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.switch_optimizer
neural_compressor.tensorflow.quantization.utils.graph_rewriter.graph_base
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.freeze_fake_quant
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.freeze_value
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_conv_redundant_dequantize
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_conv_requantize
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_redundant_dequantize
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_requantize
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.meta_op_optimizer
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.post_hostconst_converter
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.post_quantized_op_cse
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.scale_propagation
neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq
neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.insert_qdq_pattern
neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.merge_duplicated_qdq
neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.share_qdq_y_pattern
neural_compressor.tensorflow.quantization.utils.graph_util
neural_compressor.tensorflow.quantization.utils.quantize_graph
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_bn
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_concatv2
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_conv
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_deconv
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_in
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_matmul
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_pooling
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.optimize_qdq
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_base
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_bn
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_concatv2
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_conv
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_for_intel_cpu
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_matmul
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_pooling
neural_compressor.tensorflow.quantization.utils.quantize_graph_common
neural_compressor.tensorflow.quantization.utils.transform_graph
neural_compressor.tensorflow.quantization.utils.transform_graph.bias_correction
neural_compressor.tensorflow.quantization.utils.transform_graph.graph_transform_base
neural_compressor.tensorflow.quantization.utils.transform_graph.insert_logging
neural_compressor.tensorflow.quantization.utils.transform_graph.rerange_quantized_concat
neural_compressor.tensorflow.quantization.utils.utility
neural_compressor.tensorflow.utils
neural_compressor.tensorflow.utils.constants
neural_compressor.tensorflow.utils.data
neural_compressor.tensorflow.utils.model
neural_compressor.tensorflow.utils.model_wrappers
neural_compressor.tensorflow.utils.utility
neural_compressor.torch
neural_compressor.torch.algorithms
neural_compressor.torch.algorithms.autoround
neural_compressor.torch.algorithms.autoround.autoround
neural_compressor.torch.algorithms.base_algorithm
neural_compressor.torch.algorithms.fp8_quant
neural_compressor.torch.algorithms.fp8_quant.observer
neural_compressor.torch.algorithms.fp8_quant.patched_module_base
neural_compressor.torch.algorithms.fp8_quant.scaling_method_base
neural_compressor.torch.algorithms.layer_wise
neural_compressor.torch.algorithms.layer_wise.load
neural_compressor.torch.algorithms.layer_wise.modified_pickle
neural_compressor.torch.algorithms.layer_wise.utils
neural_compressor.torch.algorithms.mixed_precision
neural_compressor.torch.algorithms.mixed_precision.half_precision_convert
neural_compressor.torch.algorithms.mixed_precision.module_wrappers
neural_compressor.torch.algorithms.mx_quant
neural_compressor.torch.algorithms.mx_quant.mx
neural_compressor.torch.algorithms.mx_quant.utils
neural_compressor.torch.algorithms.pt2e_quant
neural_compressor.torch.algorithms.pt2e_quant.core
neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter
neural_compressor.torch.algorithms.pt2e_quant.save_load
neural_compressor.torch.algorithms.pt2e_quant.utility
neural_compressor.torch.algorithms.qat
neural_compressor.torch.algorithms.qat.quant_linear
neural_compressor.torch.algorithms.qat.quant_utils
neural_compressor.torch.algorithms.qat.tensor_quantizer
neural_compressor.torch.algorithms.smooth_quant
neural_compressor.torch.algorithms.smooth_quant.save_load
neural_compressor.torch.algorithms.smooth_quant.smooth_quant
neural_compressor.torch.algorithms.smooth_quant.utility
neural_compressor.torch.algorithms.static_quant
neural_compressor.torch.algorithms.static_quant.save_load
neural_compressor.torch.algorithms.static_quant.static_quant
neural_compressor.torch.algorithms.static_quant.utility
neural_compressor.torch.algorithms.weight_only
neural_compressor.torch.algorithms.weight_only.awq
neural_compressor.torch.algorithms.weight_only.gptq
neural_compressor.torch.algorithms.weight_only.hqq
neural_compressor.torch.algorithms.weight_only.hqq.bitpack
neural_compressor.torch.algorithms.weight_only.hqq.config
neural_compressor.torch.algorithms.weight_only.hqq.core
neural_compressor.torch.algorithms.weight_only.hqq.optimizer
neural_compressor.torch.algorithms.weight_only.hqq.qtensor
neural_compressor.torch.algorithms.weight_only.hqq.quantizer
neural_compressor.torch.algorithms.weight_only.modules
neural_compressor.torch.algorithms.weight_only.rtn
neural_compressor.torch.algorithms.weight_only.save_load
neural_compressor.torch.algorithms.weight_only.teq
neural_compressor.torch.algorithms.weight_only.utility
neural_compressor.torch.export
neural_compressor.torch.export.export_hf
neural_compressor.torch.export.pt2e_export
neural_compressor.torch.quantization
neural_compressor.torch.quantization.algorithm_entry
neural_compressor.torch.quantization.autotune
neural_compressor.torch.quantization.config
neural_compressor.torch.quantization.quantize
neural_compressor.torch.quantization.save_load_entry
neural_compressor.torch.utils
neural_compressor.torch.utils.auto_accelerator
neural_compressor.torch.utils.bit_packer
neural_compressor.torch.utils.block_wise
neural_compressor.torch.utils.constants
neural_compressor.torch.utils.environ
neural_compressor.torch.utils.utility
neural_compressor.version
move_input_device() (in module neural_compressor.torch.utils.utility)
move_input_to_device() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.weight_only.utility)
MoveSqueezeAfterReluOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.move_squeeze_after_relu)
MulLinear (class in neural_compressor.torch.algorithms.weight_only.modules)
mx_quant_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
MXLinear (class in neural_compressor.torch.algorithms.mx_quant.mx)
MXQuantConfig (class in neural_compressor.torch.quantization.config)
MXQuantizer (class in neural_compressor.torch.algorithms.mx_quant.mx)
N
name (neural_compressor.common.base_config.BaseConfig attribute)
nbits (neural_compressor.torch.algorithms.weight_only.hqq.qtensor.QTensorMetaInfo attribute)
need_apply() (in module neural_compressor.jax.quantization.quantize)
(in module neural_compressor.tensorflow.quantization.quantize)
(in module neural_compressor.torch.quantization.quantize)
neural_compressor
module
neural_compressor.common
module
neural_compressor.common.base_config
module
neural_compressor.common.base_tuning
module
neural_compressor.common.tuning_param
module
neural_compressor.common.utils
module
neural_compressor.common.utils.constants
module
neural_compressor.common.utils.logger
module
neural_compressor.common.utils.save_load
module
neural_compressor.common.utils.utility
module
neural_compressor.common.version
module
neural_compressor.jax
module
neural_compressor.jax.algorithms
module
neural_compressor.jax.algorithms.dynamic
module
neural_compressor.jax.algorithms.static
module
neural_compressor.jax.quantization
module
neural_compressor.jax.quantization.config
module
neural_compressor.jax.quantization.layers_dynamic
module
neural_compressor.jax.quantization.layers_static
module
neural_compressor.jax.quantization.quantize
module
neural_compressor.jax.quantization.saving
module
neural_compressor.jax.utils
module
neural_compressor.jax.utils.utility
module
neural_compressor.tensorflow
module
neural_compressor.tensorflow.algorithms
module
neural_compressor.tensorflow.algorithms.smoother
module
neural_compressor.tensorflow.algorithms.smoother.calibration
module
neural_compressor.tensorflow.algorithms.smoother.core
module
neural_compressor.tensorflow.algorithms.smoother.scaler
module
neural_compressor.tensorflow.algorithms.static_quant
module
neural_compressor.tensorflow.algorithms.static_quant.keras
module
neural_compressor.tensorflow.algorithms.static_quant.tensorflow
module
neural_compressor.tensorflow.keras
module
neural_compressor.tensorflow.keras.layers
module
neural_compressor.tensorflow.keras.layers.conv2d
module
neural_compressor.tensorflow.keras.layers.dense
module
neural_compressor.tensorflow.keras.layers.depthwise_conv2d
module
neural_compressor.tensorflow.keras.layers.layer_initializer
module
neural_compressor.tensorflow.keras.layers.pool2d
module
neural_compressor.tensorflow.keras.layers.separable_conv2d
module
neural_compressor.tensorflow.keras.quantization
module
neural_compressor.tensorflow.keras.quantization.config
module
neural_compressor.tensorflow.quantization
module
neural_compressor.tensorflow.quantization.algorithm_entry
module
neural_compressor.tensorflow.quantization.autotune
module
neural_compressor.tensorflow.quantization.config
module
neural_compressor.tensorflow.quantization.quantize
module
neural_compressor.tensorflow.quantization.utils
module
neural_compressor.tensorflow.quantization.utils.graph_converter
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.bf16
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.bf16.bf16_convert
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.bf16.dequantize_cast_optimizer
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_add_to_biasadd
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_layout
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_leakyrelu
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_nan_to_random
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.convert_placeholder_to_const
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.dilated_contraction
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.dummy_biasadd
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.expanddims_optimizer
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fetch_weight_from_reshape
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fold_batch_norm
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fold_constant
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_biasadd_add
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_column_wise_mul
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_conv_with_math
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_gelu
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_layer_norm
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_pad_with_conv
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_pad_with_fp32_conv
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_reshape_transpose
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.graph_cse_optimizer
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.grappler_pass
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.insert_print_node
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.move_squeeze_after_relu
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.pre_optimize
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.remove_training_nodes
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.rename_batch_norm
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.split_shared_input
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.strip_equivalent_nodes
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.strip_unused_nodes
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.switch_optimizer
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.graph_base
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.freeze_fake_quant
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.freeze_value
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_conv_redundant_dequantize
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_conv_requantize
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_redundant_dequantize
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.fuse_matmul_requantize
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.meta_op_optimizer
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.post_hostconst_converter
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.post_quantized_op_cse
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.scale_propagation
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.insert_qdq_pattern
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.merge_duplicated_qdq
module
neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.share_qdq_y_pattern
module
neural_compressor.tensorflow.quantization.utils.graph_util
module
neural_compressor.tensorflow.quantization.utils.quantize_graph
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_bn
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_concatv2
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_conv
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_deconv
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_in
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_matmul
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.fuse_qdq_pooling
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.optimize_qdq
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_base
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_bn
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_concatv2
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_conv
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_for_intel_cpu
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_matmul
module
neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_pooling
module
neural_compressor.tensorflow.quantization.utils.quantize_graph_common
module
neural_compressor.tensorflow.quantization.utils.transform_graph
module
neural_compressor.tensorflow.quantization.utils.transform_graph.bias_correction
module
neural_compressor.tensorflow.quantization.utils.transform_graph.graph_transform_base
module
neural_compressor.tensorflow.quantization.utils.transform_graph.insert_logging
module
neural_compressor.tensorflow.quantization.utils.transform_graph.rerange_quantized_concat
module
neural_compressor.tensorflow.quantization.utils.utility
module
neural_compressor.tensorflow.utils
module
neural_compressor.tensorflow.utils.constants
module
neural_compressor.tensorflow.utils.data
module
neural_compressor.tensorflow.utils.model
module
neural_compressor.tensorflow.utils.model_wrappers
module
neural_compressor.tensorflow.utils.utility
module
neural_compressor.torch
module
neural_compressor.torch.algorithms
module
neural_compressor.torch.algorithms.autoround
module
neural_compressor.torch.algorithms.autoround.autoround
module
neural_compressor.torch.algorithms.base_algorithm
module
neural_compressor.torch.algorithms.fp8_quant
module
neural_compressor.torch.algorithms.fp8_quant.observer
module
neural_compressor.torch.algorithms.fp8_quant.patched_module_base
module
neural_compressor.torch.algorithms.fp8_quant.scaling_method_base
module
neural_compressor.torch.algorithms.layer_wise
module
neural_compressor.torch.algorithms.layer_wise.load
module
neural_compressor.torch.algorithms.layer_wise.modified_pickle
module
neural_compressor.torch.algorithms.layer_wise.utils
module
neural_compressor.torch.algorithms.mixed_precision
module
neural_compressor.torch.algorithms.mixed_precision.half_precision_convert
module
neural_compressor.torch.algorithms.mixed_precision.module_wrappers
module
neural_compressor.torch.algorithms.mx_quant
module
neural_compressor.torch.algorithms.mx_quant.mx
module
neural_compressor.torch.algorithms.mx_quant.utils
module
neural_compressor.torch.algorithms.pt2e_quant
module
neural_compressor.torch.algorithms.pt2e_quant.core
module
neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter
module
neural_compressor.torch.algorithms.pt2e_quant.save_load
module
neural_compressor.torch.algorithms.pt2e_quant.utility
module
neural_compressor.torch.algorithms.qat
module
neural_compressor.torch.algorithms.qat.quant_linear
module
neural_compressor.torch.algorithms.qat.quant_utils
module
neural_compressor.torch.algorithms.qat.tensor_quantizer
module
neural_compressor.torch.algorithms.smooth_quant
module
neural_compressor.torch.algorithms.smooth_quant.save_load
module
neural_compressor.torch.algorithms.smooth_quant.smooth_quant
module
neural_compressor.torch.algorithms.smooth_quant.utility
module
neural_compressor.torch.algorithms.static_quant
module
neural_compressor.torch.algorithms.static_quant.save_load
module
neural_compressor.torch.algorithms.static_quant.static_quant
module
neural_compressor.torch.algorithms.static_quant.utility
module
neural_compressor.torch.algorithms.weight_only
module
neural_compressor.torch.algorithms.weight_only.awq
module
neural_compressor.torch.algorithms.weight_only.gptq
module
neural_compressor.torch.algorithms.weight_only.hqq
module
neural_compressor.torch.algorithms.weight_only.hqq.bitpack
module
neural_compressor.torch.algorithms.weight_only.hqq.config
module
neural_compressor.torch.algorithms.weight_only.hqq.core
module
neural_compressor.torch.algorithms.weight_only.hqq.optimizer
module
neural_compressor.torch.algorithms.weight_only.hqq.qtensor
module
neural_compressor.torch.algorithms.weight_only.hqq.quantizer
module
neural_compressor.torch.algorithms.weight_only.modules
module
neural_compressor.torch.algorithms.weight_only.rtn
module
neural_compressor.torch.algorithms.weight_only.save_load
module
neural_compressor.torch.algorithms.weight_only.teq
module
neural_compressor.torch.algorithms.weight_only.utility
module
neural_compressor.torch.export
module
neural_compressor.torch.export.export_hf
module
neural_compressor.torch.export.pt2e_export
module
neural_compressor.torch.quantization
module
neural_compressor.torch.quantization.algorithm_entry
module
neural_compressor.torch.quantization.autotune
module
neural_compressor.torch.quantization.config
module
neural_compressor.torch.quantization.quantize
module
neural_compressor.torch.quantization.save_load_entry
module
neural_compressor.torch.utils
module
neural_compressor.torch.utils.auto_accelerator
module
neural_compressor.torch.utils.bit_packer
module
neural_compressor.torch.utils.block_wise
module
neural_compressor.torch.utils.constants
module
neural_compressor.torch.utils.environ
module
neural_compressor.torch.utils.utility
module
neural_compressor.version
module
node_from_map() (in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_layer_norm)
node_name_from_input() (in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_layer_norm)
O
ObserverBase (class in neural_compressor.torch.algorithms.fp8_quant.observer)
OP_LEVEL (neural_compressor.common.tuning_param.ParamLevel attribute)
OP_TYPE_LEVEL (neural_compressor.common.tuning_param.ParamLevel attribute)
OperatorConfig (class in neural_compressor.jax.quantization.config)
(class in neural_compressor.tensorflow.keras.quantization.config)
(class in neural_compressor.torch.quantization.config)
optimize_weights_proximal_legacy() (in module neural_compressor.torch.algorithms.weight_only.hqq.optimizer)
OptimizeQDQGraph (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.qdq.optimize_qdq)
P
pack_array_with_numba_b2_c16() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b2_c32() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b2_c64() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b2_c8() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b4_c16() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b4_c32() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b4_c64() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b4_c8() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b8_c16() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b8_c32() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b8_c64() (in module neural_compressor.torch.utils.bit_packer)
pack_array_with_numba_b8_c8() (in module neural_compressor.torch.utils.bit_packer)
Packer (class in neural_compressor.torch.algorithms.weight_only.hqq.bitpack)
packing (neural_compressor.torch.algorithms.weight_only.hqq.qtensor.QTensorMetaInfo attribute)
ParamLevel (class in neural_compressor.common.tuning_param)
params_list (neural_compressor.common.base_config.BaseConfig attribute)
parse_cfgs() (in module neural_compressor.torch.algorithms.static_quant.utility)
parse_saved_model() (in module neural_compressor.tensorflow.quantization.utils.utility)
patch_hqq_moduile() (in module neural_compressor.torch.algorithms.weight_only.hqq.quantizer)
PatchedModuleBase (class in neural_compressor.torch.algorithms.fp8_quant.patched_module_base)
pattern_factory() (in module neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter)
PatternPair (class in neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter)
PickleError
PicklingError
PostCseOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.post_quantized_op_cse)
PostHostConstConverter (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.post_hostconst_converter)
postprocess_model() (in module neural_compressor.torch.utils.utility)
PreOptimization (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.pre_optimize)
prepare() (in module neural_compressor.torch.quantization.quantize)
prepare_deserialized_quantized_model() (in module neural_compressor.jax.quantization.saving)
prepare_qat() (in module neural_compressor.torch.quantization.quantize)
preprocess_quant_config() (in module neural_compressor.torch.quantization.quantize)
print_model() (in module neural_compressor.jax.utils.utility)
ProcessorType (class in neural_compressor.common.utils.utility)
pt2e_dynamic_quant_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
pt2e_static_quant_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
Q
QAvgPool2D (class in neural_compressor.tensorflow.keras.layers.pool2d)
QConv2D (class in neural_compressor.tensorflow.keras.layers.conv2d)
QDense (class in neural_compressor.tensorflow.keras.layers.dense)
QDepthwiseConv2D (class in neural_compressor.tensorflow.keras.layers.depthwise_conv2d)
qdq_quantize() (in module neural_compressor.torch.algorithms.smooth_quant.smooth_quant)
qdq_weight_actor() (in module neural_compressor.torch.algorithms.weight_only.utility)
qdq_weight_asym() (in module neural_compressor.torch.algorithms.weight_only.utility)
qdq_weight_sym() (in module neural_compressor.torch.algorithms.weight_only.utility)
QDQLayer (class in neural_compressor.torch.algorithms.layer_wise.utils)
(class in neural_compressor.torch.algorithms.weight_only.modules)
QDynamicCachedGemma3Attention (class in neural_compressor.jax.quantization.layers_dynamic)
QDynamicDense (class in neural_compressor.jax.quantization.layers_dynamic)
QDynamicDenseMixin (class in neural_compressor.jax.quantization.layers_dynamic)
QDynamicEinsumDense (class in neural_compressor.jax.quantization.layers_dynamic)
QDynamicGemma3VisionAttention (class in neural_compressor.jax.quantization.layers_dynamic)
QDynamicMultiHeadAttention (class in neural_compressor.jax.quantization.layers_dynamic)
QDynamicReversibleEmbedding (class in neural_compressor.jax.quantization.layers_dynamic)
QMaxPool2D (class in neural_compressor.tensorflow.keras.layers.pool2d)
QSeparableConv2D (class in neural_compressor.tensorflow.keras.layers.separable_conv2d)
QStaticCachedGemma3Attention (class in neural_compressor.jax.quantization.layers_static)
QStaticDense (class in neural_compressor.jax.quantization.layers_static)
QStaticDenseMixin (class in neural_compressor.jax.quantization.layers_static)
QStaticEinsumDense (class in neural_compressor.jax.quantization.layers_static)
QStaticGemma3VisionAttention (class in neural_compressor.jax.quantization.layers_static)
QStaticMultiHeadAttention (class in neural_compressor.jax.quantization.layers_static)
QStaticReversibleEmbedding (class in neural_compressor.jax.quantization.layers_static)
QStaticRotaryEmbedding (class in neural_compressor.jax.quantization.layers_static)
QTensor (class in neural_compressor.torch.algorithms.weight_only.hqq.qtensor)
QTensorConfig (class in neural_compressor.torch.algorithms.weight_only.hqq.config)
QTensorMetaInfo (class in neural_compressor.torch.algorithms.weight_only.hqq.qtensor)
quant_config_from_json_object() (in module neural_compressor.jax.quantization.saving)
quant_config_to_json_object() (in module neural_compressor.jax.quantization.saving)
quant_dequant_w_v1() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
quant_dequant_x_v1() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
quant_tensor() (in module neural_compressor.torch.algorithms.weight_only.utility)
quant_weight_w_scale() (in module neural_compressor.torch.algorithms.weight_only.utility)
quantize() (in module neural_compressor.torch.quantization.quantize)
quantize_4bit() (in module neural_compressor.torch.algorithms.weight_only.utility)
quantize_elemwise_op() (in module neural_compressor.torch.algorithms.mx_quant.utils)
quantize_model() (in module neural_compressor.jax.quantization.quantize)
(in module neural_compressor.tensorflow.quantization.quantize)
quantize_model_with_single_config() (in module neural_compressor.tensorflow.quantization.quantize)
quantize_mx_op() (in module neural_compressor.torch.algorithms.mx_quant.utils)
QuantizeGraphBase (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_base)
QuantizeGraphForIntel (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_for_intel_cpu)
QuantizeGraphHelper (class in neural_compressor.tensorflow.quantization.utils.quantize_graph_common)
QuantizeNodeBase (class in neural_compressor.tensorflow.quantization.utils.quantize_graph.quantize_graph_base)
Quantizer (class in neural_compressor.torch.algorithms.base_algorithm)
(class in neural_compressor.torch.algorithms.weight_only.gptq)
QuantLinear (class in neural_compressor.torch.algorithms.qat.quant_linear)
R
RAWGPTQuantizer (class in neural_compressor.torch.algorithms.weight_only.gptq)
read_graph() (in module neural_compressor.tensorflow.quantization.utils.utility)
read_json_file() (in module neural_compressor.torch.utils.utility)
reconstruct_saved_model() (in module neural_compressor.tensorflow.quantization.utils.utility)
recover_forward() (in module neural_compressor.torch.algorithms.weight_only.utility)
(in module neural_compressor.torch.utils.block_wise)
recover_model_from_json() (in module neural_compressor.torch.algorithms.smooth_quant.save_load)
register_accelerator() (in module neural_compressor.torch.utils.auto_accelerator)
register_algo() (in module neural_compressor.jax.utils.utility)
(in module neural_compressor.tensorflow.utils.utility)
(in module neural_compressor.torch.utils.utility)
register_autotune() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
register_config() (in module neural_compressor.common.base_config)
register_dynamic_quantized_layer() (in module neural_compressor.jax.quantization.layers_dynamic)
register_observer() (in module neural_compressor.torch.algorithms.fp8_quant.observer)
register_pack_func() (in module neural_compressor.torch.utils.bit_packer)
register_patched_module() (in module neural_compressor.torch.algorithms.fp8_quant.patched_module_base)
register_scaling_methods() (in module neural_compressor.torch.algorithms.fp8_quant.scaling_method_base)
register_static_quantized_layer() (in module neural_compressor.jax.quantization.layers_static)
register_supported_configs_for_fwk() (in module neural_compressor.common.base_config)
register_weight_hooks() (in module neural_compressor.torch.algorithms.layer_wise.utils)
RemoveTrainingNodesOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.remove_training_nodes)
RenameBatchNormOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.rename_batch_norm)
replace_forward() (in module neural_compressor.torch.algorithms.weight_only.utility)
(in module neural_compressor.torch.utils.block_wise)
replace_pattern (neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter.PatternPair attribute)
replace_with_quant_linear() (in module neural_compressor.torch.algorithms.qat.quant_utils)
replacement_fn() (in module neural_compressor.torch.algorithms.weight_only.hqq.quantizer)
RerangeQuantizedConcat (class in neural_compressor.tensorflow.quantization.utils.transform_graph.rerange_quantized_concat)
reshape_in_channel_to_last() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
reshape_scale_as_input() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
reshape_scale_as_weight() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
RoundingMode (class in neural_compressor.torch.algorithms.mx_quant.utils)
rtn_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
RTNConfig (class in neural_compressor.torch.quantization.config)
RTNQuantizer (class in neural_compressor.torch.algorithms.weight_only.rtn)
S
Sampler (class in neural_compressor.common.base_tuning)
save() (in module neural_compressor.torch.algorithms.pt2e_quant.save_load)
(in module neural_compressor.torch.algorithms.static_quant.save_load)
(in module neural_compressor.torch.algorithms.weight_only.save_load)
(in module neural_compressor.torch.quantization.save_load_entry)
save_config_mapping() (in module neural_compressor.common.utils.save_load)
save_layers_in_shards_iteratively() (in module neural_compressor.torch.algorithms.layer_wise.utils)
SaveableLayerMixin (class in neural_compressor.jax.quantization.saving)
saved_model_session() (in module neural_compressor.tensorflow.utils.model_wrappers)
SaveLoadFormat (class in neural_compressor.torch.utils.constants)
ScaleProPagationTransformer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.int8.scale_propagation)
ScalingMethodBase (class in neural_compressor.torch.algorithms.fp8_quant.scaling_method_base)
search_clip() (in module neural_compressor.torch.algorithms.weight_only.utility)
search_pattern (neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter.PatternPair attribute)
SequentialSampler (class in neural_compressor.common.base_tuning)
(class in neural_compressor.tensorflow.utils.data)
set_module() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
(in module neural_compressor.torch.algorithms.weight_only.utility)
(in module neural_compressor.torch.utils.utility)
set_random_seed() (in module neural_compressor.common.utils.utility)
set_resume_from() (in module neural_compressor.common.utils.utility)
set_tensorboard() (in module neural_compressor.common.utils.utility)
set_workspace() (in module neural_compressor.common.utils.utility)
shape (neural_compressor.torch.algorithms.weight_only.hqq.qtensor.QTensorMetaInfo attribute)
ShareQDQForItexYPatternOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.qdq.share_qdq_y_pattern)
simple_inference() (in module neural_compressor.torch.algorithms.static_quant.utility)
singleton() (in module neural_compressor.common.utils.utility)
(in module neural_compressor.tensorflow.utils.utility)
slim_session() (in module neural_compressor.tensorflow.utils.model_wrappers)
smooth_quant_entry() (in module neural_compressor.tensorflow.quantization.algorithm_entry)
(in module neural_compressor.torch.quantization.algorithm_entry)
SmoothQuant (class in neural_compressor.tensorflow.algorithms.smoother.core)
SmoothQuantCalibration (class in neural_compressor.tensorflow.algorithms.smoother.calibration)
SmoothQuantCalibrationLLM (class in neural_compressor.tensorflow.algorithms.smoother.calibration)
SmoothQuantConfig (class in neural_compressor.tensorflow.quantization.config)
(class in neural_compressor.torch.quantization.config)
SmoothQuantQuantizer (class in neural_compressor.torch.algorithms.smooth_quant.smooth_quant)
SmoothQuantScaler (class in neural_compressor.tensorflow.algorithms.smoother.scaler)
SmoothQuantScalerLLM (class in neural_compressor.tensorflow.algorithms.smoother.scaler)
SplitSharedInputOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.split_shared_input)
SQLinearWrapper (class in neural_compressor.torch.algorithms.smooth_quant.utility)
static_quant_entry() (in module neural_compressor.tensorflow.quantization.algorithm_entry)
(in module neural_compressor.torch.quantization.algorithm_entry)
static_quantize() (in module neural_compressor.jax.algorithms.static)
StaticQDQLayer (class in neural_compressor.jax.quantization.layers_static)
StaticQuantConfig (class in neural_compressor.jax.quantization.config)
(class in neural_compressor.tensorflow.keras.quantization.config)
(class in neural_compressor.tensorflow.quantization.config)
(class in neural_compressor.torch.quantization.config)
StaticQuantQuantizer (class in neural_compressor.torch.algorithms.static_quant.static_quant)
Statistics (class in neural_compressor.common.utils.utility)
strip_equivalent_nodes() (in module neural_compressor.tensorflow.quantization.utils.utility)
strip_unused_nodes() (in module neural_compressor.tensorflow.quantization.utils.utility)
StripEquivalentNodesOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.strip_equivalent_nodes)
StripUnusedNodesOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.strip_unused_nodes)
SwitchOptimizer (class in neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.switch_optimizer)
T
Tensorflow_ITEXAdaptor (class in neural_compressor.tensorflow.algorithms.static_quant.tensorflow)
TensorFlowAdaptor (class in neural_compressor.tensorflow.algorithms.static_quant.tensorflow)
TensorflowBaseModel (class in neural_compressor.tensorflow.utils.model_wrappers)
TensorflowCheckpointModel (class in neural_compressor.tensorflow.utils.model_wrappers)
TensorFlowConfig (class in neural_compressor.tensorflow.algorithms.static_quant.tensorflow)
TensorflowConfigConverter (class in neural_compressor.tensorflow.algorithms.static_quant.tensorflow)
TensorflowGlobalConfig (class in neural_compressor.tensorflow.utils.model)
TensorflowLLMModel (class in neural_compressor.tensorflow.utils.model_wrappers)
TensorflowModel (class in neural_compressor.tensorflow.utils.model_wrappers)
TensorflowQuery (class in neural_compressor.tensorflow.algorithms.static_quant.tensorflow)
TensorflowSavedModelModel (class in neural_compressor.tensorflow.utils.model_wrappers)
TensorQuantizer (class in neural_compressor.torch.algorithms.qat.tensor_quantizer)
teq_quantize_entry() (in module neural_compressor.torch.quantization.algorithm_entry)
TEQConfig (class in neural_compressor.torch.quantization.config)
TEQLinearFakeQuant (class in neural_compressor.torch.algorithms.weight_only.modules)
TEQuantizer (class in neural_compressor.torch.algorithms.weight_only.teq)
TFSlimNetsFactory (class in neural_compressor.tensorflow.utils.utility)
to_device() (in module neural_compressor.torch.utils.utility)
to_dtype() (in module neural_compressor.torch.utils.utility)
TorchBaseConfig (class in neural_compressor.torch.quantization.config)
TorchSmoothQuant (class in neural_compressor.torch.algorithms.smooth_quant.utility)
trace_gptq_target_blocks() (in module neural_compressor.torch.algorithms.weight_only.gptq)
TrainableEquivalentTransformation (class in neural_compressor.torch.algorithms.weight_only.teq)
transformation() (in module neural_compressor.torch.algorithms.pt2e_quant.half_precision_rewriter)
TransformerBasedModelBlockPatternDetector (class in neural_compressor.torch.algorithms.static_quant.utility)
try_loading_keras() (in module neural_compressor.tensorflow.utils.model_wrappers)
TuningConfig (class in neural_compressor.common.base_tuning)
TuningLogger (class in neural_compressor.common.utils.logger)
TuningMonitor (class in neural_compressor.common.base_tuning)
TuningParam (class in neural_compressor.common.tuning_param)
U
UnpackedWeightOnlyLinearParams (class in neural_compressor.torch.algorithms.weight_only.modules)
UnpicklingError
update_module() (in module neural_compressor.torch.algorithms.layer_wise.utils)
update_sq_scale() (in module neural_compressor.torch.algorithms.smooth_quant.utility)
V
valid_keras_format() (in module neural_compressor.tensorflow.utils.utility)
valid_reshape_inputs() (in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in)
validate_and_inference_input_output() (in module neural_compressor.tensorflow.utils.model_wrappers)
validate_graph_node() (in module neural_compressor.tensorflow.utils.model_wrappers)
validate_modules() (in module neural_compressor.torch.utils.utility)
values_from_const() (in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_bn)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_decomposed_in)
(in module neural_compressor.tensorflow.quantization.utils.graph_rewriter.generic.fuse_layer_norm)
verify_api() (in module neural_compressor.jax.utils.utility)
version1_eq_version2() (in module neural_compressor.tensorflow.utils.utility)
version1_gt_version2() (in module neural_compressor.tensorflow.utils.utility)
version1_gte_version2() (in module neural_compressor.tensorflow.utils.utility)
version1_lt_version2() (in module neural_compressor.tensorflow.utils.utility)
version1_lte_version2() (in module neural_compressor.tensorflow.utils.utility)
VersionManager (class in neural_compressor.jax.quantization.saving)
W
W8A8PT2EQuantizer (class in neural_compressor.torch.algorithms.pt2e_quant.core)
WeightOnlyLinear (class in neural_compressor.torch.algorithms.weight_only.modules)
white_list (neural_compressor.tensorflow.quantization.config.SmoothQuantConfig attribute)
WOQModelLoader (class in neural_compressor.torch.algorithms.weight_only.save_load)
WrapperLayer (class in neural_compressor.torch.algorithms.smooth_quant.utility)
write_graph() (in module neural_compressor.tensorflow.quantization.utils.utility)
write_json_file() (in module neural_compressor.torch.utils.utility)
X
XPU_Accelerator (class in neural_compressor.torch.utils.auto_accelerator)