diff --git a/docs/api_doc/optimization/config.rst b/docs/api_doc/optimization/config.rst index 435f5d6ddad..2ca607c03dc 100644 --- a/docs/api_doc/optimization/config.rst +++ b/docs/api_doc/optimization/config.rst @@ -4,7 +4,4 @@ Config .. autoapisummary:: intel_extension_for_transformers.transformers.utils.metrics intel_extension_for_transformers.transformers.utils.objectives - intel_extension_for_transformers.transformers.config - intel_extension_for_transformers.transformers.quantization - intel_extension_for_transformers.transformers.distillation - intel_extension_for_transformers.transformers.pruning + intel_extension_for_transformers.transformers.utils.config diff --git a/docs/api_doc/optimization/tf_optimization.rst b/docs/api_doc/optimization/tf_optimization.rst deleted file mode 100644 index 3aa7cb7864a..00000000000 --- a/docs/api_doc/optimization/tf_optimization.rst +++ /dev/null @@ -1,6 +0,0 @@ -TensorFlow Optimizer -============== - -.. autoapisummary:: - - intel_extension_for_transformers.transformers.optimizer_tf diff --git a/docs/api_doc/user_api.rst b/docs/api_doc/user_api.rst index 712132f5d55..80a7ead6078 100644 --- a/docs/api_doc/user_api.rst +++ b/docs/api_doc/user_api.rst @@ -7,7 +7,5 @@ The following Python API information is available: :maxdepth: 1 optimization/trainer.rst - optimization/optimizer.rst optimization/model.rst - optimization/tf_optimization.rst optimization/config.rst diff --git a/examples/.config/tensorflow_optimize.json b/examples/.config/tensorflow_optimize.json deleted file mode 100644 index ab0aacaf6ce..00000000000 --- a/examples/.config/tensorflow_optimize.json +++ /dev/null @@ -1,255 +0,0 @@ -{ - "bert_base_mrpc_static": { - "working_dir": "huggingface/tensorflow/text-classification/quantization/ptq", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "bert_base_mrpc_static", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/text-classification" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "bert_base_mrpc_static", - "mode": "accuracy", - "batch_size": "64", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/text-classification" - } - } - }, - "distilgpt2_clm": { - "working_dir": "huggingface/tensorflow/language-modeling/quantization/ptq", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "distilgpt2_clm", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/language-modeling" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "distilgpt2_clm", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/language-modeling" - } - } - }, - "distilbert_mlm": { - "working_dir": "huggingface/tensorflow/language-modeling/quantization/ptq", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "distilbert_mlm", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/language-modeling" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "distilbert_mlm", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/language-modeling" - } - } - }, - "bert_base_ner": { - "working_dir": "huggingface/tensorflow/token-classification/quantization", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "bert_base_ner", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/token-classification" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "bert_base_ner", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/token-classification" - } - } - }, - "distilbert_qa": { - "working_dir": "huggingface/tensorflow/question-answering/quantization", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "distilbert_qa", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/question-answering" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "distilbert_qa", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/question-answering" - } - } - }, - "distilbert_swag": { - "working_dir": "huggingface/tensorflow/multiple-choice/quantization", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "distilbert_swag", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/multiple-choice" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "distilbert_swag", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/multiple-choice" - } - } - }, - "roberta_qa": { - "working_dir": "huggingface/tensorflow/question-answering/quantization", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "roberta_qa", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/question-answering" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "roberta_qa", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/question-answering" - } - } - }, - "distilroberta_mlm": { - "working_dir": "huggingface/tensorflow/language-modeling/quantization/ptq", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "distilroberta_mlm", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/language-modeling" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "distilroberta_mlm", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/language-modeling" - } - } - }, - "legalbert_mrpc": { - "working_dir": "huggingface/tensorflow/text-classification/quantization/ptq", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "legalbert_mrpc", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/text-classification" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "legalbert_mrpc", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/text-classification" - } - } - }, - "xlnet_mrpc": { - "working_dir": "huggingface/tensorflow/text-classification/quantization/ptq", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "xlnet_mrpc", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/text-classification" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "xlnet_mrpc", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/text-classification" - } - } - }, - "albert_large_mrpc": { - "working_dir": "huggingface/tensorflow/text-classification/quantization/ptq", - "tune":{ - "cmd": "bash run_tuning.sh", - "params": { - "topology": "albert_large_mrpc", - "output_model": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/text-classification" - } - }, - "benchmark": { - "cmd": "bash run_benchmark.sh", - "params": { - "topology": "albert_large_mrpc", - "mode": "accuracy", - "batch_size": "16", - "iters": "100", - "int8": "false", - "config": "saved_results", - "cache_dir": "${HOME}/.cache/nlp_toolkit/text-classification" - } - } - } -}