LICENSE
README.md
setup.py
./intel_extension_for_transformers/__init__.py
./intel_extension_for_transformers/version.py
./intel_extension_for_transformers/backends/__init__.py
./intel_extension_for_transformers/backends/neural_engine/__init__.py
./intel_extension_for_transformers/backends/neural_engine/compile/__init__.py
./intel_extension_for_transformers/backends/neural_engine/compile/compile.py
./intel_extension_for_transformers/backends/neural_engine/compile/graph_utils.py
./intel_extension_for_transformers/backends/neural_engine/compile/logger.py
./intel_extension_for_transformers/backends/neural_engine/compile/onnx_utils.py
./intel_extension_for_transformers/backends/neural_engine/compile/tf_utils.py
./intel_extension_for_transformers/backends/neural_engine/compile/extractors/__init__.py
./intel_extension_for_transformers/backends/neural_engine/compile/extractors/extractor.py
./intel_extension_for_transformers/backends/neural_engine/compile/extractors/onnx_extractor.py
./intel_extension_for_transformers/backends/neural_engine/compile/extractors/tf_extractor.py
./intel_extension_for_transformers/backends/neural_engine/compile/graph/__init__.py
./intel_extension_for_transformers/backends/neural_engine/compile/graph/graph.py
./intel_extension_for_transformers/backends/neural_engine/compile/loaders/__init__.py
./intel_extension_for_transformers/backends/neural_engine/compile/loaders/loader.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/__init__.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/all.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/assert.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/batch_matmul.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/batch_matmul_v2.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/bias_add.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/cast.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/concat.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/conv.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/empty_ops.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/expand_dims.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/fused_batch_matmul_v2.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/fused_batch_norm_v3.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/fused_gemm.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/fused_matmul.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/gather.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/gather_elements.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/gelu.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/gemm.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/iterator_get_next.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/iterator_v2.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/layer_normalization.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/map_and_batch_dataset.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/matmul.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/mean.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/mkl_layer_norm.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/model_dataset.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/one_hot.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/onnx_input.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/op.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/optimize_dataset.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/pack.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/placeholder.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/quantize_linear.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/quantize_v2.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/quantized_fused_matmul_and_dequantize.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/quantized_matmul_with_bias_and_dequantize.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/reduce_mean.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/reduce_sum.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/reshape.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/scatter_elements.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/softmax.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/split.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/squeeze.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/strided_slice.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/tensor.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/top_k.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/transpose.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/unpack.py
./intel_extension_for_transformers/backends/neural_engine/compile/ops/unsqueeze.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/__init__.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/add_cls_token.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/add_embeddings.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/attention_mask_length_adaptive_keep_indices.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/attention_output_layer_norm_length_adaptive_keep_indices.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/attention_reshape.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/collect_quant_info.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/conv_reshape.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/embeddingbag.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/gelu.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/generate_sequence.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/input_data.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/input_file.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/insert_bf16_node.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/insert_quant_node.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/interact_features.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/last_layer_shape.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/layer_norm.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/layer_norm_with_reduce_mean.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/matmul_with_bias.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/matmul_with_bias_add.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/matmul_with_bias_gelu.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/matmul_with_bias_relu.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/matmul_with_bias_sigmoid.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/matmul_with_bias_tanh.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/merged_embeddingbag.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/output_data.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/padding_sequence.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/pattern.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/position_embeddings.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/position_embeddings_v1.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/qkv_merge.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/qkv_reshape.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/quantize_fusion.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/reshape_after_restore_hidden_states.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/reshape_before_and_after_attention_out_layer_norm_gather_elements.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/reshape_before_restore_hidden_states.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/reshape_fusion.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/restore_hidden_states_in_length_adaptive_update_indices.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/start_end_logits.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/subgraph_matcher.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/token_type_embeddings.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/token_type_embeddings_v1.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/transpose_batch_matmul.py
./intel_extension_for_transformers/backends/neural_engine/compile/sub_graph/word_embeddings.py
./intel_extension_for_transformers/optimization/__init__.py
./intel_extension_for_transformers/optimization/benchmark.py
./intel_extension_for_transformers/optimization/config.py
./intel_extension_for_transformers/optimization/distillation.py
./intel_extension_for_transformers/optimization/model.py
./intel_extension_for_transformers/optimization/optimizer.py
./intel_extension_for_transformers/optimization/optimizer_tf.py
./intel_extension_for_transformers/optimization/pipeline.py
./intel_extension_for_transformers/optimization/pruning.py
./intel_extension_for_transformers/optimization/quantization.py
./intel_extension_for_transformers/optimization/trainer.py
./intel_extension_for_transformers/optimization/dynamic/__init__.py
./intel_extension_for_transformers/optimization/dynamic/drop_and_restore_utils.py
./intel_extension_for_transformers/optimization/dynamic/evolution.py
./intel_extension_for_transformers/optimization/mixture/__init__.py
./intel_extension_for_transformers/optimization/mixture/auto_distillation.py
./intel_extension_for_transformers/optimization/pytorch_pruner/__init__.py
./intel_extension_for_transformers/optimization/pytorch_pruner/patterns.py
./intel_extension_for_transformers/optimization/pytorch_pruner/prune_utils.py
./intel_extension_for_transformers/optimization/pytorch_pruner/pruner.py
./intel_extension_for_transformers/optimization/pytorch_pruner/pruning.py
./intel_extension_for_transformers/optimization/pytorch_pruner/scheduler.py
./intel_extension_for_transformers/optimization/utils/__init__.py
./intel_extension_for_transformers/optimization/utils/metrics.py
./intel_extension_for_transformers/optimization/utils/objectives.py
./intel_extension_for_transformers/optimization/utils/utility.py
./intel_extension_for_transformers/optimization/utils/utility_tf.py
./intel_extension_for_transformers/optimization/utils/models/__init__.py
./intel_extension_for_transformers/optimization/utils/models/modeling_bert_dynamic.py
./intel_extension_for_transformers/optimization/utils/models/modeling_roberta_dynamic.py
./intel_extension_for_transformers/preprocessing/__init__.py
./intel_extension_for_transformers/preprocessing/data_augmentation.py
./intel_extension_for_transformers/preprocessing/utils.py
intel_extension_for_transformers.egg-info/PKG-INFO
intel_extension_for_transformers.egg-info/SOURCES.txt
intel_extension_for_transformers.egg-info/dependency_links.txt
intel_extension_for_transformers.egg-info/requires.txt
intel_extension_for_transformers.egg-info/top_level.txt
intel_extension_for_transformers/backends/neural_engine/bin/neural_engine