diff --git a/latest/CODE_OF_CONDUCT.html b/latest/CODE_OF_CONDUCT.html index 28971c139..80826f485 100644 --- a/latest/CODE_OF_CONDUCT.html +++ b/latest/CODE_OF_CONDUCT.html @@ -4,7 +4,7 @@ - Contributor Covenant Code of Conduct — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Contributor Covenant Code of Conduct — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -225,7 +225,7 @@

AttributionSphinx using a theme provided by Read the Docs. - +

Cookies | Privacy
diff --git a/latest/SECURITY.html b/latest/SECURITY.html index 6e37733c4..230ac2f38 100644 --- a/latest/SECURITY.html +++ b/latest/SECURITY.html @@ -4,7 +4,7 @@ - Security Policy — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Security Policy — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -120,7 +120,7 @@

Report a VulnerabilitySphinx using a theme provided by Read the Docs. - +

diff --git a/latest/_sources/docs/community/contributing.md.txt b/latest/_sources/docs/community/contributing.md.txt index 7a5102849..faffe40a9 100644 --- a/latest/_sources/docs/community/contributing.md.txt +++ b/latest/_sources/docs/community/contributing.md.txt @@ -116,8 +116,8 @@ To check bazel files manually: ```bash # install go -wget https://golang.org/dl/go1.15.3.linux-.html64.tar.gz -sudo tar -C /usr/local -xzf go1.15.3.linux-.html64.tar.gz +wget https://golang.org/dl/go1.15.3.linux-amd64.tar.gz +sudo tar -C /usr/local -xzf go1.15.3.linux-amd64.tar.gz export PATH=$PATH:/usr/local/go/bin # install buildifier diff --git a/latest/_sources/docs/design/how_to_write_custom_op.md.txt b/latest/_sources/docs/design/how_to_write_custom_op.md.txt index 8d3d04248..05626fb31 100644 --- a/latest/_sources/docs/design/how_to_write_custom_op.md.txt +++ b/latest/_sources/docs/design/how_to_write_custom_op.md.txt @@ -130,7 +130,7 @@ class EltwiseBaseOp : public OpKernel { } ...... // Create an eltwise forward descriptor and primitive descriptor - eltwise_forward::desc fwd_desc(prop_kind::forward, alg_kind_, src.html, + eltwise_forward::desc fwd_desc(prop_kind::forward, alg_kind_, src_md, alpha_, beta_); dnnl::primitive_attr attr; attr.set_scratchpad_mode(dnnl::scratchpad_mode::user); diff --git a/latest/_sources/docs/install/experimental/install_for_arc_gpu.md.txt b/latest/_sources/docs/install/experimental/install_for_arc_gpu.md.txt index a3d3297b6..de35ba936 100644 --- a/latest/_sources/docs/install/experimental/install_for_arc_gpu.md.txt +++ b/latest/_sources/docs/install/experimental/install_for_arc_gpu.md.txt @@ -72,7 +72,7 @@ The steps to install the runtime components in Ubuntu Linux (within WSL2) are: sudo apt-get install -y gpg-agent wget wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | sudo gpg --dearmor --output /usr/share/keyrings/intel-graphics.gpg - echo "deb [arch=.html64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list + echo "deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list sudo apt-get update ``` @@ -122,7 +122,7 @@ The steps to install the runtime components in Ubuntu Linux are: sudo apt-get install -y gpg-agent wget wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | sudo gpg --dearmor --output /usr/share/keyrings/intel-graphics.gpg - echo "deb [arch=.html64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list + echo "deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list sudo apt-get update ``` diff --git a/latest/_static/documentation_options.js b/latest/_static/documentation_options.js index e6c0d9379..4bcfb6d68 100644 --- a/latest/_static/documentation_options.js +++ b/latest/_static/documentation_options.js @@ -1,5 +1,5 @@ const DOCUMENTATION_OPTIONS = { - VERSION: '0.1.dev1+gc09a994', + VERSION: '0.1.dev1+g26e99fc', LANGUAGE: 'en', COLLAPSE_INDEX: false, BUILDER: 'html', diff --git a/latest/docker/README.html b/latest/docker/README.html index e9ece2143..c1c4c162b 100644 --- a/latest/docker/README.html +++ b/latest/docker/README.html @@ -4,7 +4,7 @@ - Intel® Extension for TensorFlow* Docker Container Guide — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Intel® Extension for TensorFlow* Docker Container Guide — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -213,7 +213,7 @@

Verify That Intel GPU is Accessible From TensorFlowSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docker/tensorflow-serving/README.html b/latest/docker/tensorflow-serving/README.html index 0142b97fa..d83c89a6b 100644 --- a/latest/docker/tensorflow-serving/README.html +++ b/latest/docker/tensorflow-serving/README.html @@ -4,7 +4,7 @@ - Intel® Extension for TensorFlow* Serving - Docker Container Guide — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Intel® Extension for TensorFlow* Serving - Docker Container Guide — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -169,7 +169,7 @@

Running the ContainerSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/README.html b/latest/docs/README.html index f3da94eef..2e882c24d 100644 --- a/latest/docs/README.html +++ b/latest/docs/README.html @@ -4,7 +4,7 @@ - Welcome to Intel® Extension for TensorFlow* documentation — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Welcome to Intel® Extension for TensorFlow* documentation — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -234,7 +234,7 @@

HighlightsSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/build_docs/docs_build_tips.html b/latest/docs/build_docs/docs_build_tips.html index 58622d364..966b2418e 100644 --- a/latest/docs/build_docs/docs_build_tips.html +++ b/latest/docs/build_docs/docs_build_tips.html @@ -4,7 +4,7 @@ - Online Documentation Build Guide — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Online Documentation Build Guide — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -161,7 +161,7 @@

Build to Local TestSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/build_docs/source/index.html b/latest/docs/build_docs/source/index.html index 012c15b83..8ed8cd38d 100644 --- a/latest/docs/build_docs/source/index.html +++ b/latest/docs/build_docs/source/index.html @@ -4,7 +4,7 @@ - Welcome to Intel ® Extension for TensorFlow* documentation! — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Welcome to Intel ® Extension for TensorFlow* documentation! — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -110,7 +110,7 @@

Welcome to Intel ® Extension for TensorFlow* documentation!Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/community/contributing.html b/latest/docs/community/contributing.html index e8443acb3..ff90cfbd6 100644 --- a/latest/docs/community/contributing.html +++ b/latest/docs/community/contributing.html @@ -4,7 +4,7 @@ - Contributing guidelines — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Contributing guidelines — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -221,8 +221,8 @@

bazel style guidebuildifier is a tool for formatting bazel BUILD and .bzl files with a standard convention (xxx.tpl files are not supported).

To check bazel files manually:

# install go
-wget https://golang.org/dl/go1.15.3.linux-.html64.tar.gz
-sudo tar -C /usr/local -xzf go1.15.3.linux-.html64.tar.gz
+wget https://golang.org/dl/go1.15.3.linux-amd64.tar.gz
+sudo tar -C /usr/local -xzf go1.15.3.linux-amd64.tar.gz
 export PATH=$PATH:/usr/local/go/bin
 
 # install buildifier
@@ -260,7 +260,7 @@ 

Documentation style guideSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/community/releases.html b/latest/docs/community/releases.html index 11d546c54..36b2dec32 100644 --- a/latest/docs/community/releases.html +++ b/latest/docs/community/releases.html @@ -4,7 +4,7 @@ - Releases — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Releases — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -130,7 +130,7 @@

Incompatible ChangesSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/design/directory_structure.html b/latest/docs/design/directory_structure.html index e754aedfb..ac916d806 100644 --- a/latest/docs/design/directory_structure.html +++ b/latest/docs/design/directory_structure.html @@ -4,7 +4,7 @@ - Directory Tree Structure — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Directory Tree Structure — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -186,7 +186,7 @@

Directory Tree StructureSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/design/extension_design.html b/latest/docs/design/extension_design.html index 6251c5069..27ed1ca48 100644 --- a/latest/docs/design/extension_design.html +++ b/latest/docs/design/extension_design.html @@ -4,7 +4,7 @@ - Extension Design — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Extension Design — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -124,7 +124,7 @@

ResourcesSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/design/how_to_write_custom_op.html b/latest/docs/design/how_to_write_custom_op.html index 96e714f18..35fc31559 100644 --- a/latest/docs/design/how_to_write_custom_op.html +++ b/latest/docs/design/how_to_write_custom_op.html @@ -4,7 +4,7 @@ - How to write custom op — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + How to write custom op — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -232,7 +232,7 @@

4. Implement the kernels } ...... // Create an eltwise forward descriptor and primitive descriptor - eltwise_forward::desc fwd_desc(prop_kind::forward, alg_kind_, src.html, + eltwise_forward::desc fwd_desc(prop_kind::forward, alg_kind_, src_md, alpha_, beta_); dnnl::primitive_attr attr; attr.set_scratchpad_mode(dnnl::scratchpad_mode::user); @@ -381,7 +381,7 @@

9. Install and VerifySphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/design/optimization/README.html b/latest/docs/design/optimization/README.html index 11faf1ee1..83b06b9d6 100644 --- a/latest/docs/design/optimization/README.html +++ b/latest/docs/design/optimization/README.html @@ -4,7 +4,7 @@ - Optimizations Design — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Optimizations Design — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -109,7 +109,7 @@

Optimizations DesignSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/design/optimization/oneDNN_object_cache.html b/latest/docs/design/optimization/oneDNN_object_cache.html index 63ce24afe..8f40a54b2 100644 --- a/latest/docs/design/optimization/oneDNN_object_cache.html +++ b/latest/docs/design/optimization/oneDNN_object_cache.html @@ -4,7 +4,7 @@ - oneDNN object cache optimization — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + oneDNN object cache optimization — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -130,7 +130,7 @@

Optimization in convolutionSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/FAQ.html b/latest/docs/guide/FAQ.html index aae9575d8..b49e4dbad 100644 --- a/latest/docs/guide/FAQ.html +++ b/latest/docs/guide/FAQ.html @@ -4,7 +4,7 @@ - Frequently Asked Questions — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Frequently Asked Questions — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -206,7 +206,7 @@

Runtime Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/INT8_quantization.html b/latest/docs/guide/INT8_quantization.html index 79b6a57cf..37400e6e0 100644 --- a/latest/docs/guide/INT8_quantization.html +++ b/latest/docs/guide/INT8_quantization.html @@ -4,7 +4,7 @@ - INT8 Quantization — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + INT8 Quantization — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -159,7 +159,7 @@

UsageSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/OpenXLA.html b/latest/docs/guide/OpenXLA.html index de7465dc7..7d6b6531c 100644 --- a/latest/docs/guide/OpenXLA.html +++ b/latest/docs/guide/OpenXLA.html @@ -4,7 +4,7 @@ - OpenXLA — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + OpenXLA — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -212,7 +212,7 @@

ReferencesSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/XPUAutoShard.html b/latest/docs/guide/XPUAutoShard.html index 869527655..ec81a7d39 100644 --- a/latest/docs/guide/XPUAutoShard.html +++ b/latest/docs/guide/XPUAutoShard.html @@ -4,7 +4,7 @@ - XPUAutoShard on GPU [Experimental] — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + XPUAutoShard on GPU [Experimental] — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -194,7 +194,7 @@

Examples Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/aamp_tune.html b/latest/docs/guide/aamp_tune.html index f6d02bd7d..1f553f2f9 100644 --- a/latest/docs/guide/aamp_tune.html +++ b/latest/docs/guide/aamp_tune.html @@ -4,7 +4,7 @@ - Tune Advanced Auto Mixed Precision — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Tune Advanced Auto Mixed Precision — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -439,7 +439,7 @@

Tuning Performance Example on MobileNetSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/advanced_auto_mixed_precision.html b/latest/docs/guide/advanced_auto_mixed_precision.html index 47ce26c57..c01c91932 100644 --- a/latest/docs/guide/advanced_auto_mixed_precision.html +++ b/latest/docs/guide/advanced_auto_mixed_precision.html @@ -4,7 +4,7 @@ - Advanced Auto Mixed Precision — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Advanced Auto Mixed Precision — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -420,7 +420,7 @@

Custom OperationSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/environment_variables.html b/latest/docs/guide/environment_variables.html index e25b2230f..063de7ff5 100644 --- a/latest/docs/guide/environment_variables.html +++ b/latest/docs/guide/environment_variables.html @@ -4,7 +4,7 @@ - Environment Variables — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Environment Variables — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -234,7 +234,7 @@

Auto Mixed Precision OptionsSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/features.html b/latest/docs/guide/features.html index 41d90a796..6227426a4 100644 --- a/latest/docs/guide/features.html +++ b/latest/docs/guide/features.html @@ -4,7 +4,7 @@ - Features — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Features — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -227,7 +227,7 @@

TensorFlow ServingSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/how_to_enable_profiler.html b/latest/docs/guide/how_to_enable_profiler.html index 256b2eb97..a2fe76fd7 100644 --- a/latest/docs/guide/how_to_enable_profiler.html +++ b/latest/docs/guide/how_to_enable_profiler.html @@ -4,7 +4,7 @@ - GPU Profiler — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + GPU Profiler — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -212,7 +212,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/infrastructure.html b/latest/docs/guide/infrastructure.html index 4416ecf43..89f538f8c 100644 --- a/latest/docs/guide/infrastructure.html +++ b/latest/docs/guide/infrastructure.html @@ -4,7 +4,7 @@ - Infrastructure — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Infrastructure — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -147,7 +147,7 @@

XPU EngineSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/itex_fusion.html b/latest/docs/guide/itex_fusion.html index 616e16cd9..ae4043d82 100644 --- a/latest/docs/guide/itex_fusion.html +++ b/latest/docs/guide/itex_fusion.html @@ -4,7 +4,7 @@ - Graph fusion — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Graph fusion — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -315,7 +315,7 @@

Generic layout optimizerSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/itex_ops.html b/latest/docs/guide/itex_ops.html index ede1dbe66..c78caf275 100644 --- a/latest/docs/guide/itex_ops.html +++ b/latest/docs/guide/itex_ops.html @@ -4,7 +4,7 @@ - Customized Operators — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Customized Operators — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -305,7 +305,7 @@

itex.ops.ItexLS Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/itex_ops_override.html b/latest/docs/guide/itex_ops_override.html index 814d61fe7..502bc059f 100644 --- a/latest/docs/guide/itex_ops_override.html +++ b/latest/docs/guide/itex_ops_override.html @@ -4,7 +4,7 @@ - Operators Override — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Operators Override — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -213,7 +213,7 @@

AdamWSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/keras3_support.html b/latest/docs/guide/keras3_support.html index 3ccfbfc5d..af4c06d14 100644 --- a/latest/docs/guide/keras3_support.html +++ b/latest/docs/guide/keras3_support.html @@ -4,7 +4,7 @@ - Keras 3 Overview — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Keras 3 Overview — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -234,7 +234,7 @@

Situations leads to warning or ErrorSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/keras_mixed_precision.html b/latest/docs/guide/keras_mixed_precision.html index 798507445..1c7ac29cb 100644 --- a/latest/docs/guide/keras_mixed_precision.html +++ b/latest/docs/guide/keras_mixed_precision.html @@ -4,7 +4,7 @@ - Keras Mixed Precision — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Keras Mixed Precision — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -417,7 +417,7 @@

Training the model with a custom training loopSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/launch.html b/latest/docs/guide/launch.html index 3341db74d..a1e0e1f61 100644 --- a/latest/docs/guide/launch.html +++ b/latest/docs/guide/launch.html @@ -4,7 +4,7 @@ - Launch Script User Guide — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Launch Script User Guide — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -913,7 +913,7 @@

Default memory allocatorSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/next_pluggable_device.html b/latest/docs/guide/next_pluggable_device.html index ba519f3d6..2e6a7e3e1 100644 --- a/latest/docs/guide/next_pluggable_device.html +++ b/latest/docs/guide/next_pluggable_device.html @@ -4,7 +4,7 @@ - NextPluggableDevice Overview — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + NextPluggableDevice Overview — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -176,7 +176,7 @@

Check Currently Used Device TypeSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/performance.html b/latest/docs/guide/performance.html index aac770539..0cd4a93e8 100644 --- a/latest/docs/guide/performance.html +++ b/latest/docs/guide/performance.html @@ -4,7 +4,7 @@ - Performance Data — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Performance Data — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -984,7 +984,7 @@

Additional Performance Data for Intel AI Data Center ProductsSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/practice_guide.html b/latest/docs/guide/practice_guide.html index f3a3763a1..8b154d013 100644 --- a/latest/docs/guide/practice_guide.html +++ b/latest/docs/guide/practice_guide.html @@ -4,7 +4,7 @@ - Practice Guide — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Practice Guide — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -324,7 +324,7 @@

GPU Practice GuideSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/python_api.html b/latest/docs/guide/python_api.html index 09cfd42d6..f7f00b3fb 100644 --- a/latest/docs/guide/python_api.html +++ b/latest/docs/guide/python_api.html @@ -4,7 +4,7 @@ - Python APIs — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Python APIs — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -503,7 +503,7 @@

itex versionSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/tf_serving_install.html b/latest/docs/guide/tf_serving_install.html index 2c4229146..96a6c09fb 100644 --- a/latest/docs/guide/tf_serving_install.html +++ b/latest/docs/guide/tf_serving_install.html @@ -4,7 +4,7 @@ - Install TensorFlow Serving with Intel® Extension for TensorFlow* — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Install TensorFlow Serving with Intel® Extension for TensorFlow* — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -370,7 +370,7 @@

Run sampleSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/threadpool.html b/latest/docs/guide/threadpool.html index 8b57cb475..41c292ebb 100644 --- a/latest/docs/guide/threadpool.html +++ b/latest/docs/guide/threadpool.html @@ -4,7 +4,7 @@ - Selecting Thread Pool in Intel® Extension for TensorFlow* CPU [Experimental] — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Selecting Thread Pool in Intel® Extension for TensorFlow* CPU [Experimental] — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -303,7 +303,7 @@

Example Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/guide/weight_prepack.html b/latest/docs/guide/weight_prepack.html index d18cf0710..7aeabc023 100644 --- a/latest/docs/guide/weight_prepack.html +++ b/latest/docs/guide/weight_prepack.html @@ -4,7 +4,7 @@ - Online Weight Prepack — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Online Weight Prepack — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -166,7 +166,7 @@

ReferenceSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/install/experimental/install_for_arc_gpu.html b/latest/docs/install/experimental/install_for_arc_gpu.html index a96a991d6..f9cc47a7a 100644 --- a/latest/docs/install/experimental/install_for_arc_gpu.html +++ b/latest/docs/install/experimental/install_for_arc_gpu.html @@ -4,7 +4,7 @@ - Experimental: Intel® Arc™ A-Series GPU Software Installation — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Experimental: Intel® Arc™ A-Series GPU Software Installation — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -188,7 +188,7 @@
Ubuntu Linux Installed in WSL2
sudo apt-get install -y gpg-agent wget
 wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | 
 sudo gpg --dearmor --output /usr/share/keyrings/intel-graphics.gpg
-echo "deb [arch=.html64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list
+echo "deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list
 sudo apt-get update
 

@@ -245,7 +245,7 @@

Native Linux Running Directly on Hardware
sudo apt-get install -y gpg-agent wget
 wget -qO - https://repositories.intel.com/gpu/intel-graphics.key | 
 sudo gpg --dearmor --output /usr/share/keyrings/intel-graphics.gpg
-echo "deb [arch=.html64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list
+echo "deb [arch=amd64 signed-by=/usr/share/keyrings/intel-graphics.gpg] https://repositories.intel.com/gpu/ubuntu jammy/lts/2350 unified" | sudo tee /etc/apt/sources.list.d/intel-gpu-jammy.list
 sudo apt-get update
 

@@ -372,7 +372,7 @@

Setup environment variablesSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/install/experimental/install_for_gpu_conda.html b/latest/docs/install/experimental/install_for_gpu_conda.html index 0742b0c08..5f0d47130 100644 --- a/latest/docs/install/experimental/install_for_gpu_conda.html +++ b/latest/docs/install/experimental/install_for_gpu_conda.html @@ -4,7 +4,7 @@ - Conda Environment Installation Instructions — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Conda Environment Installation Instructions — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -193,7 +193,7 @@

Step by step instructions:Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/install/how_to_build.html b/latest/docs/install/how_to_build.html index f77318030..309adf8d9 100644 --- a/latest/docs/install/how_to_build.html +++ b/latest/docs/install/how_to_build.html @@ -4,7 +4,7 @@ - Overview — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Overview — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -519,7 +519,7 @@

Configure Example For XPUSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/install/install_for_cpp.html b/latest/docs/install/install_for_cpp.html index 2167ac655..c17f67b2e 100644 --- a/latest/docs/install/install_for_cpp.html +++ b/latest/docs/install/install_for_cpp.html @@ -4,7 +4,7 @@ - Intel® Extension for TensorFlow* for C++ — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Intel® Extension for TensorFlow* for C++ — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -537,7 +537,7 @@

Build and runSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/install/install_for_cpu.html b/latest/docs/install/install_for_cpu.html index 87fda059c..aede6219d 100644 --- a/latest/docs/install/install_for_cpu.html +++ b/latest/docs/install/install_for_cpu.html @@ -4,7 +4,7 @@ - Intel CPU Software Installation — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Intel CPU Software Installation — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -220,7 +220,7 @@

Verify the InstallationSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/install/install_for_xpu.html b/latest/docs/install/install_for_xpu.html index 05a991896..9037cad14 100644 --- a/latest/docs/install/install_for_xpu.html +++ b/latest/docs/install/install_for_xpu.html @@ -4,7 +4,7 @@ - Intel XPU Software Installation — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Intel XPU Software Installation — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -321,7 +321,7 @@

XPU for CPU only platform (Deprecated)Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/docs/install/installation_guide.html b/latest/docs/install/installation_guide.html index f2e694e3b..ff7970843 100644 --- a/latest/docs/install/installation_guide.html +++ b/latest/docs/install/installation_guide.html @@ -4,7 +4,7 @@ - Installation Guide — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Installation Guide — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -133,7 +133,7 @@

Installation GuideSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/README.html b/latest/examples/README.html index dfa309bf7..d4793f36a 100644 --- a/latest/examples/README.html +++ b/latest/examples/README.html @@ -4,7 +4,7 @@ - Examples — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Examples — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -205,7 +205,7 @@

ExamplesSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/accelerate_alexnet_by_quantization/README.html b/latest/examples/accelerate_alexnet_by_quantization/README.html index 47bb641e5..5693a35d6 100644 --- a/latest/examples/accelerate_alexnet_by_quantization/README.html +++ b/latest/examples/accelerate_alexnet_by_quantization/README.html @@ -4,7 +4,7 @@ - Accelerate AlexNet by Quantization with Intel® Extension for Tensorflow* — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Accelerate AlexNet by Quantization with Intel® Extension for Tensorflow* — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -170,7 +170,7 @@

Execute Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/common_guide_running.html b/latest/examples/common_guide_running.html index b8d5e67cd..7d04b129d 100644 --- a/latest/examples/common_guide_running.html +++ b/latest/examples/common_guide_running.html @@ -4,7 +4,7 @@ - Common Guide for Running — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Common Guide for Running — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -165,7 +165,7 @@

Run ScriptSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/infer_inception_v4_amp/README.html b/latest/examples/infer_inception_v4_amp/README.html index 2b6747b8a..6e9b425e8 100644 --- a/latest/examples/infer_inception_v4_amp/README.html +++ b/latest/examples/infer_inception_v4_amp/README.html @@ -4,7 +4,7 @@ - Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -346,7 +346,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/infer_resnet50/README.html b/latest/examples/infer_resnet50/README.html index d8afa27cb..a77d650c0 100644 --- a/latest/examples/infer_resnet50/README.html +++ b/latest/examples/infer_resnet50/README.html @@ -4,7 +4,7 @@ - ResNet50 Inference on Intel CPU and GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + ResNet50 Inference on Intel CPU and GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -165,7 +165,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/itex_quantization_example/README.html b/latest/examples/itex_quantization_example/README.html index 3d15a7f4b..618061e1b 100644 --- a/latest/examples/itex_quantization_example/README.html +++ b/latest/examples/itex_quantization_example/README.html @@ -4,7 +4,7 @@ - Intel® Extension for Tensorflow* Model Quantization API Example — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Intel® Extension for Tensorflow* Model Quantization API Example — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -214,7 +214,7 @@

Run Model Quantization Example:Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/model_zoo_example/README.html b/latest/examples/model_zoo_example/README.html index af4782886..9e8f581f5 100644 --- a/latest/examples/model_zoo_example/README.html +++ b/latest/examples/model_zoo_example/README.html @@ -4,7 +4,7 @@ - Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -130,7 +130,7 @@

Run Models on Bare MetalSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/pretrain_bert/README.html b/latest/examples/pretrain_bert/README.html index 29b6e979e..cc1e12257 100644 --- a/latest/examples/pretrain_bert/README.html +++ b/latest/examples/pretrain_bert/README.html @@ -4,7 +4,7 @@ - Accelerate BERT-Large Pretraining on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Accelerate BERT-Large Pretraining on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -527,7 +527,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/quantize_inception_v3/README.html b/latest/examples/quantize_inception_v3/README.html index 345564eff..ff4c58bef 100644 --- a/latest/examples/quantize_inception_v3/README.html +++ b/latest/examples/quantize_inception_v3/README.html @@ -4,7 +4,7 @@ - Quantize Inception V3 by Intel® Extension for Tensorflow* on Intel® Xeon® — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Quantize Inception V3 by Intel® Extension for Tensorflow* on Intel® Xeon® — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -237,7 +237,7 @@

License Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/quick_example.html b/latest/examples/quick_example.html index 0ed6e6372..ec8c99569 100644 --- a/latest/examples/quick_example.html +++ b/latest/examples/quick_example.html @@ -4,7 +4,7 @@ - Quick Example on Intel CPU and GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Quick Example on Intel CPU and GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -196,7 +196,7 @@

NotesSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/stable_diffussion_inference/README.html b/latest/examples/stable_diffussion_inference/README.html index bfa1d3854..2c0be71cc 100644 --- a/latest/examples/stable_diffussion_inference/README.html +++ b/latest/examples/stable_diffussion_inference/README.html @@ -4,7 +4,7 @@ - Stable Diffusion Inference for Text2Image on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Stable Diffusion Inference for Text2Image on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -225,7 +225,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/train_3d_unet/README.html b/latest/examples/train_3d_unet/README.html index 034739705..4ad0a3dff 100644 --- a/latest/examples/train_3d_unet/README.html +++ b/latest/examples/train_3d_unet/README.html @@ -4,7 +4,7 @@ - Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -229,7 +229,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/train_bert/README.html b/latest/examples/train_bert/README.html index dab3e4c8b..40e90bce4 100644 --- a/latest/examples/train_bert/README.html +++ b/latest/examples/train_bert/README.html @@ -4,7 +4,7 @@ - BERT Training for Classifying Text on Intel CPU and GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + BERT Training for Classifying Text on Intel CPU and GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -208,7 +208,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/train_bert_fp8/README.html b/latest/examples/train_bert_fp8/README.html index bc7d3964f..a3bc8f4f5 100644 --- a/latest/examples/train_bert_fp8/README.html +++ b/latest/examples/train_bert_fp8/README.html @@ -4,7 +4,7 @@ - FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -201,7 +201,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/train_horovod/mnist/README.html b/latest/examples/train_horovod/mnist/README.html index e68e55251..964b90f29 100644 --- a/latest/examples/train_horovod/mnist/README.html +++ b/latest/examples/train_horovod/mnist/README.html @@ -4,7 +4,7 @@ - Distributed Training Example with Intel® Optimization for Horovod* on Intel® GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Distributed Training Example with Intel® Optimization for Horovod* on Intel® GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -221,7 +221,7 @@

Output< Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/train_horovod/resnet50/README.html b/latest/examples/train_horovod/resnet50/README.html index 76d9031b6..f8e2c5212 100644 --- a/latest/examples/train_horovod/resnet50/README.html +++ b/latest/examples/train_horovod/resnet50/README.html @@ -4,7 +4,7 @@ - Refer to train_resnet50 — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Refer to train_resnet50 — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -108,7 +108,7 @@

Refer to Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/train_maskrcnn/README.html b/latest/examples/train_maskrcnn/README.html index b9f950223..3e25168e7 100644 --- a/latest/examples/train_maskrcnn/README.html +++ b/latest/examples/train_maskrcnn/README.html @@ -4,7 +4,7 @@ - Accelerate Mask R-CNN Training on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Accelerate Mask R-CNN Training on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -234,7 +234,7 @@

FAQSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/train_resnet50/README.html b/latest/examples/train_resnet50/README.html index 9c0ac2d7f..c6ad15506 100644 --- a/latest/examples/train_resnet50/README.html +++ b/latest/examples/train_resnet50/README.html @@ -4,7 +4,7 @@ - Resnet50 train on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Resnet50 train on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -252,7 +252,7 @@

Example Output with hvdSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/examples/train_resnet50_with_autoshard/README.html b/latest/examples/train_resnet50_with_autoshard/README.html index 81938cde0..651b26ad0 100644 --- a/latest/examples/train_resnet50_with_autoshard/README.html +++ b/latest/examples/train_resnet50_with_autoshard/README.html @@ -4,7 +4,7 @@ - Accelerate ResNet50 Training by XPUAutoShard on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Accelerate ResNet50 Training by XPUAutoShard on Intel GPU — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -278,7 +278,7 @@

Example OutputSphinx using a theme provided by Read the Docs. - +

diff --git a/latest/genindex.html b/latest/genindex.html index 7bd920511..645fdd0c1 100644 --- a/latest/genindex.html +++ b/latest/genindex.html @@ -3,7 +3,7 @@ - Index — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Index — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -109,7 +109,7 @@

Index

Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/get_started.html b/latest/get_started.html index 79e77758b..794eedefc 100644 --- a/latest/get_started.html +++ b/latest/get_started.html @@ -4,7 +4,7 @@ - Intel® Extension for TensorFlow* — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Intel® Extension for TensorFlow* — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -331,7 +331,7 @@

License Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/objects.inv b/latest/objects.inv index 60ba67930..ceb808d2b 100644 Binary files a/latest/objects.inv and b/latest/objects.inv differ diff --git a/latest/search.html b/latest/search.html index 245bb07a8..ce93f1650 100644 --- a/latest/search.html +++ b/latest/search.html @@ -3,7 +3,7 @@ - Search — Intel® Extension for TensorFlow* 0.1.dev1+gc09a994 documentation + Search — Intel® Extension for TensorFlow* 0.1.dev1+g26e99fc documentation @@ -126,7 +126,7 @@ Built with Sphinx using a theme provided by Read the Docs. - +

diff --git a/latest/searchindex.js b/latest/searchindex.js index 23a1359b2..937b65ca0 100644 --- a/latest/searchindex.js +++ b/latest/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"1. Prerequisite": [[11, "prerequisite"]], "1. Build Intel\u00ae Extension for TensorFlow* C++ library": [[34, "build-intel-extension-for-tensorflow-c-library"]], "1. Correction": [[0, "correction"]], "1. Install GPU Drivers": [[37, "install-gpu-drivers"]], "2. Define the op interface and Register op": [[11, "define-the-op-interface-and-register-op"]], "2. Build TensorFlow Serving": [[34, "build-tensorflow-serving"]], "2. Install TensorFlow* via PyPI Wheel in Linux": [[37, "install-tensorflow-via-pypi-wheel-in-linux"]], "2. Warning": [[0, "warning"]], "3. Register the kernels for the op": [[11, "register-the-kernels-for-the-op"]], "3. Install Intel\u00ae Extension for TensorFlow*": [[37, "install-intel-extension-for-tensorflow"]], "3. Temporary Ban": [[0, "temporary-ban"]], "4. Implement the kernels": [[11, "implement-the-kernels"]], "4. Permanent Ban": [[0, "permanent-ban"]], "4. Verify the Installation": [[37, "verify-the-installation"]], "6. Add the op to BUILD": [[11, "add-the-op-to-build"]], "7. Use the op in Python": [[11, "use-the-op-in-python"]], "8. Build the package": [[11, "build-the-package"]], "9. Install and Verify": [[11, "install-and-verify"]], "Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU": [[55, "accelerate-3d-unet-training-w-o-horovod-for-medical-image-segmentation-on-intel-gpu"]], "Accelerate AlexNet by Quantization with Intel\u00ae Extension for Tensorflow*": [[45, "accelerate-alexnet-by-quantization-with-intel-extension-for-tensorflow"]], "Accelerate BERT-Large Pretraining on Intel GPU": [[51, "accelerate-bert-large-pretraining-on-intel-gpu"]], "Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU": [[50, "accelerate-deep-learning-training-and-inference-for-model-zoo-workloads-on-intel-gpu"]], "Accelerate Mask R-CNN Training on Intel GPU": [[60, "accelerate-mask-r-cnn-training-on-intel-gpu"]], "Accelerate ResNet50 Training by XPUAutoShard on Intel GPU": [[62, "accelerate-resnet50-training-by-xpuautoshard-on-intel-gpu"]], "Accuracy": [[54, "accuracy"], [57, "accuracy"]], "AdamW": [[26, "adamw"]], "Additional": [[39, "additional"]], "Additional Performance Data for Intel AI Data Center Products": [[31, "additional-performance-data-for-intel-ai-data-center-products"]], "Advanced AMP vs. Stock TensorFlow AMP": [[19, "advanced-amp-vs-stock-tensorflow-amp"]], "Advanced Auto Mixed Precision": [[19, "advanced-auto-mixed-precision"], [19, "id1"]], "Advanced Auto Mixed Precision (AMP)": [[21, "advanced-auto-mixed-precision-amp"]], "Advanced Settings": [[29, "advanced-settings"]], "Advanced: Enable Advanced AMP Method": [[47, "advanced-enable-advanced-amp-method"]], "Apply Model Quantization": [[49, "apply-model-quantization"]], "Apply Patch": [[61, "apply-patch"]], "Apply Patch for Intel GPU": [[58, "apply-patch-for-intel-gpu"]], "Architecture": [[23, "architecture"]], "Attribution": [[0, "attribution"]], "Auto Mixed Precision Options": [[20, "auto-mixed-precision-options"]], "BERT Training for Classifying Text on Intel CPU and GPU": [[56, "bert-training-for-classifying-text-on-intel-cpu-and-gpu"]], "BERT-Large Phase2 Training Performance Results": [[31, "bert-large-phase2-training-performance-results"]], "BF16 + FP8 Fine-tuning": [[57, "bf16-fp8-fine-tuning"]], "Backend and Config Protocol": [[20, "backend-and-config-protocol"]], "Background": [[18, "background"], [45, "background"], [52, "background"]], "Basic Settings": [[29, "basic-settings"]], "Basic fusion": [[24, "basic-fusion"]], "Binaries Preparation": [[2, "binaries-preparation"]], "Build Docker container from Dockerfile": [[41, "build-docker-container-from-dockerfile"], [42, "build-docker-container-from-dockerfile"]], "Build Docker image from Dockerfile": [[34, "build-docker-image-from-dockerfile"]], "Build Intel\u00ae Extension for TensorFlow* CC library": [[40, "build-intel-extension-for-tensorflow-cc-library"]], "Build Intel\u00ae Extension for TensorFlow* PyPI": [[39, "build-intel-extension-for-tensorflow-pypi"]], "Build Source Code": [[39, "build-source-code"], [40, "build-source-code"]], "Build and run": [[40, "build-and-run"]], "Build from source": [[14, "build-from-source"], [34, "build-from-source"]], "Build the Docker Image": [[3, "build-the-docker-image"]], "Build to Local Test": [[5, "build-to-local-test"]], "Building the model": [[28, "building-the-model"]], "C++ coding style": [[7, "c-coding-style"]], "CPU": [[52, "cpu"]], "CPU Launcher [Experimental]": [[21, "cpu-launcher-experimental"]], "CPU Practice Guide": [[32, "cpu-practice-guide"]], "Check Currently Used Device Type": [[30, "check-currently-used-device-type"]], "Check Device Count (Optional)": [[58, "check-device-count-optional"]], "Check Intel\u00ae Advanced Matrix Extensions": [[52, "check-intel-advanced-matrix-extensions"]], "Check Intel\u00ae Deep Learning Boost": [[52, "check-intel-deep-learning-boost"]], "Check the Environment for XPU": [[42, "check-the-environment-for-xpu"]], "Clone Horovod Repo": [[58, "clone-horovod-repo"]], "Clone the Repository": [[47, "clone-the-repository"]], "Code": [[53, "code"]], "Code Structure": [[17, "code-structure"]], "Code style guide": [[7, "code-style-guide"]], "Command": [[61, "command"]], "Command with Horovod": [[61, "command-with-horovod"]], "Commands": [[51, "commands"]], "Common Execution Mode": [[29, "common-execution-mode"]], "Common Guide for Running": [[46, "common-guide-for-running"]], "Common Requirements": [[39, "common-requirements"], [40, "common-requirements"]], "Compatibility Table": [[63, "compatibility-table"]], "Conda Environment Installation Instructions": [[38, "conda-environment-installation-instructions"]], "Configuration": [[31, "configuration"], [52, "configuration"]], "Configuration List": [[18, "configuration-list"]], "Configuration via Environment Variables": [[20, "configuration-via-environment-variables"]], "Configure": [[39, "configure"], [40, "configure"]], "Configure Example For XPU": [[39, "configure-example-for-xpu"]], "Configure Example for CPU": [[39, "configure-example-for-cpu"]], "Configure For CPU": [[39, "configure-for-cpu"], [40, "configure-for-cpu"]], "Configure For GPU": [[40, "configure-for-gpu"]], "Configure For XPU": [[39, "configure-for-xpu"]], "Contributing": [[63, "contributing"]], "Contributing guidelines": [[7, "contributing-guidelines"]], "Contributing to Intel\u00ae Extension for TensorFlow*": [[7, "contributing-to-intel-extension-for-tensorflow"]], "Contributor Covenant Code of Conduct": [[0, "contributor-covenant-code-of-conduct"]], "Convergence": [[51, "convergence"]], "Create Release Version": [[5, "create-release-version"]], "Create Virtual Environment": [[58, "create-virtual-environment"]], "Create a Conda Environment": [[39, "create-a-conda-environment"], [40, "create-a-conda-environment"]], "Custom API": [[23, "custom-api"]], "Custom Operation": [[19, "custom-operation"]], "Customized Operators": [[25, "customized-operators"]], "Data Type": [[19, "data-type"]], "Default memory allocator": [[29, "default-memory-allocator"]], "Dense Layer": [[26, "dense-layer"]], "Dependency": [[58, "dependency"]], "Description": [[2, "description"], [3, "description"]], "Developing Intel\u00ae Extension for TensorFlow*": [[7, "developing-intel-extension-for-tensorflow"]], "Directory Tree Structure": [[9, "directory-tree-structure"]], "Disable Constant Folding Function": [[52, "disable-constant-folding-function"]], "Distributed Training Example with Intel\u00ae Optimization for Horovod* on Intel\u00ae GPU": [[58, "distributed-training-example-with-intel-optimization-for-horovod-on-intel-gpu"]], "Documentation": [[4, "documentation"], [63, "documentation"]], "Documentation style guide": [[7, "documentation-style-guide"]], "Download Jupyter Code:": [[56, "download-jupyter-code"]], "Download Patch": [[58, "download-patch"]], "Download Source Code": [[39, "download-source-code"], [40, "download-source-code"]], "Download the Pretrained-model": [[47, "download-the-pretrained-model"]], "Dump the graph": [[17, "dump-the-graph"]], "Ease-of-use Python API": [[21, "ease-of-use-python-api"]], "EfficientNet-B0 Inference Performance Results": [[31, "efficientnet-b0-inference-performance-results"]], "EfficientNet-B3 Inference Performance Results": [[31, "efficientnet-b3-inference-performance-results"]], "Enable Advanced AMP": [[19, "enable-advanced-amp"]], "Enable Running Environment": [[47, "enable-running-environment"], [48, "enable-running-environment"], [51, "enable-running-environment"], [54, "enable-running-environment"], [55, "enable-running-environment"], [56, "enable-running-environment"], [57, "enable-running-environment"], [60, "enable-running-environment"], [61, "enable-running-environment"], [62, "enable-running-environment"]], "Enable Virtual Running Environment": [[46, "enable-virtual-running-environment"]], "Enable oneAPI": [[58, "enable-oneapi"]], "Enable oneAPI Running Environment": [[46, "enable-oneapi-running-environment"]], "Enable oneDNN Graph": [[52, "enable-onednn-graph"]], "End-to-end Example": [[18, "end-to-end-example"]], "Enforcement": [[0, "enforcement"]], "Enforcement Guidelines": [[0, "enforcement-guidelines"]], "Enforcement Responsibilities": [[0, "enforcement-responsibilities"]], "Environment Variable Configuration": [[47, "environment-variable-configuration"]], "Environment Variable Difference with Stock TensorFlow": [[18, "environment-variable-difference-with-stock-tensorflow"]], "Environment Variables": [[20, "environment-variables"], [29, "environment-variables"]], "Environment Variables with Python APIs": [[20, "environment-variables-with-python-apis"]], "Environment Vasriable": [[54, "environment-vasriable"]], "Example": [[16, "example"], [18, "example"], [19, "example"], [35, "example"], [40, "example"]], "Example Output": [[48, "example-output"], [53, "example-output"], [54, "example-output"], [62, "example-output"]], "Example Output with hvd": [[61, "example-output-with-hvd"]], "Example Output without hvd": [[61, "example-output-without-hvd"]], "Example of Mix Precision by List": [[18, "example-of-mix-precision-by-list"]], "Example:": [[22, "example"]], "Examples": [[17, "examples"], [29, "examples"], [44, "examples"], [44, "id1"]], "Execute": [[45, "execute"], [56, "execute"]], "Execute Testing and Comparing the Performance of FP32 and Advanced AMP on CPU and GPU in Docker Container or Bare Metal": [[47, "execute-testing-and-comparing-the-performance-of-fp32-and-advanced-amp-on-cpu-and-gpu-in-docker-container-or-bare-metal"]], "Execute the Example": [[51, "execute-the-example"], [55, "execute-the-example"], [57, "execute-the-example"], [60, "execute-the-example"]], "Executes the Example with Python API": [[48, "executes-the-example-with-python-api"], [54, "executes-the-example-with-python-api"], [62, "executes-the-example-with-python-api"]], "Executing Command": [[62, "executing-command"]], "Execution": [[58, "execution"], [61, "execution"]], "Experimental Release": [[37, "experimental-release"]], "Experimental: Intel\u00ae Arc\u2122 A-Series GPU Software Installation": [[37, "experimental-intel-arc-a-series-gpu-software-installation"]], "Extension Design": [[10, "extension-design"]], "Extra Requirements for XPU Build Only": [[39, "extra-requirements-for-xpu-build-only"]], "Extra Requirements for XPU/GPU Build Only": [[40, "extra-requirements-for-xpu-gpu-build-only"]], "FAQ": [[22, "faq"], [47, "faq"], [48, "faq"], [51, "faq"], [54, "faq"], [55, "faq"], [56, "faq"], [57, "faq"], [60, "faq"]], "FP16 Inference": [[54, "fp16-inference"]], "FP32 Inference": [[54, "fp32-inference"]], "FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU": [[57, "fp8-bert-large-fine-tuning-for-classifying-text-on-intel-gpu"]], "Feature": [[19, "feature"]], "Features": [[21, "features"]], "Finetune Command": [[51, "finetune-command"]], "Frequently Asked Questions": [[14, "frequently-asked-questions"]], "Further Settings": [[62, "further-settings"]], "GNU OpenMP": [[32, "gnu-openmp"]], "GPU": [[45, "gpu"], [52, "gpu"]], "GPU Practice Guide": [[32, "gpu-practice-guide"]], "GPU Profiler": [[21, "gpu-profiler"], [22, "gpu-profiler"]], "Gelu Activation": [[26, "gelu-activation"]], "Generic layout optimizer": [[24, "generic-layout-optimizer"]], "Get docker container from dockerhub": [[41, "get-docker-container-from-dockerhub"], [42, "get-docker-container-from-dockerhub"]], "Graph Optimization": [[21, "graph-optimization"]], "Graph Optimizer": [[19, "graph-optimizer"]], "Graph fusion": [[24, "graph-fusion"]], "Hardware Configuration": [[31, "hardware-configuration"], [32, "hardware-configuration"]], "Hardware Configuration for Intel Flex 170 GPU": [[31, "hardware-configuration-for-intel-flex-170-gpu"]], "Hardware Configuration for Intel Max 1550 GPU": [[31, "hardware-configuration-for-intel-max-1550-gpu"]], "Hardware Environment": [[45, "hardware-environment"], [52, "hardware-environment"]], "Hardware Requirement": [[47, "hardware-requirement"], [63, "hardware-requirement"]], "Hardware Requirements": [[37, "hardware-requirements"], [39, "hardware-requirements"], [40, "hardware-requirements"], [41, "hardware-requirements"], [42, "hardware-requirements"], [51, "hardware-requirements"], [54, "hardware-requirements"], [55, "hardware-requirements"], [56, "hardware-requirements"], [57, "hardware-requirements"], [60, "hardware-requirements"], [61, "hardware-requirements"], [62, "hardware-requirements"]], "Highlights": [[4, "highlights"]], "How it works": [[16, "how-it-works"]], "How to identify different hardware types?": [[28, "how-to-identify-different-hardware-types"]], "How to write custom op": [[11, "how-to-write-custom-op"]], "I. Binaries Preparation": [[3, "i-binaries-preparation"]], "I. Customize Build Script": [[2, "i-customize-build-script"]], "I. Use all physical cores": [[29, "i-use-all-physical-cores"]], "II. Build the Container": [[2, "ii-build-the-container"], [3, "ii-build-the-container"]], "II. Use all cores including logical cores": [[29, "ii-use-all-cores-including-logical-cores"]], "III. Running the Container": [[2, "iii-running-the-container"]], "III. Use physical cores on one node": [[29, "iii-use-physical-cores-on-one-node"]], "INT8 Quantization": [[15, "int8-quantization"], [21, "int8-quantization"]], "ITEX_VERBOSE level definition": [[20, "itex-verbose-level-definition"]], "IV. Use your designated number of cores": [[29, "iv-use-your-designated-number-of-cores"]], "IX. Set environment variable TF_NUM_INTRAOP_THREADS": [[29, "ix-set-environment-variable-tf-num-intraop-threads"]], "If not use Horovod": [[61, "if-not-use-horovod"]], "If use Horovod": [[61, "if-use-horovod"]], "Implementation Details": [[24, "implementation-details"]], "Incompatible Changes": [[8, "incompatible-changes"]], "Inference Performance Results": [[31, "inference-performance-results"]], "Inference Performance on 1x Intel Data Center GPU Flex 170": [[31, "inference-performance-on-1x-intel-data-center-gpu-flex-170"]], "Inference Workloads": [[31, "inference-workloads"]], "Infrastructure": [[23, "infrastructure"]], "Install": [[58, "install"], [63, "install"]], "Install Bazel": [[39, "install-bazel"], [40, "install-bazel"]], "Install Clang-17 compiler": [[39, "install-clang-17-compiler"]], "Install GPU Drivers": [[42, "install-gpu-drivers"]], "Install Intel GPU Driver": [[39, "install-intel-gpu-driver"], [40, "install-intel-gpu-driver"]], "Install Intel\u00ae Extension for TensorFlow*": [[41, "install-intel-extension-for-tensorflow"], [42, "install-intel-extension-for-tensorflow"]], "Install Intel\u00ae Extension for Tensorflow*": [[49, "install-intel-extension-for-tensorflow"]], "Install Intel\u00ae Neural Compressor": [[49, "install-intel-neural-compressor"]], "Install Model Server": [[34, "install-model-server"]], "Install Other Required Packages": [[62, "install-other-required-packages"]], "Install TensorFlow": [[37, "install-tensorflow"], [39, "install-tensorflow"], [40, "install-tensorflow"], [41, "install-tensorflow"], [42, "install-tensorflow"]], "Install TensorFlow Serving with Intel\u00ae Extension for TensorFlow*": [[34, "install-tensorflow-serving-with-intel-extension-for-tensorflow"]], "Install for CPU": [[63, "install-for-cpu"]], "Install for CPU weekly": [[63, "install-for-cpu-weekly"]], "Install for XPU": [[63, "install-for-xpu"]], "Install for XPU weekly": [[63, "install-for-xpu-weekly"]], "Install for weekly binaries": [[63, "install-for-weekly-binaries"]], "Install oneAPI Base Toolkit": [[39, "install-oneapi-base-toolkit"], [40, "install-oneapi-base-toolkit"]], "Install oneAPI Base Toolkit Packages": [[42, "install-oneapi-base-toolkit-packages"]], "Install using Docker": [[34, "install-using-docker"]], "Install via Docker container": [[41, "install-via-docker-container"], [42, "install-via-docker-container"]], "Install via PyPI wheel in bare metal": [[41, "install-via-pypi-wheel-in-bare-metal"], [42, "install-via-pypi-wheel-in-bare-metal"]], "Installation": [[53, "installation"]], "Installation Channel:": [[63, "installation-channel"]], "Installation Guide": [[43, "installation-guide"]], "Instance Normalization": [[26, "instance-normalization"]], "Integrate the CC library": [[40, "integrate-the-cc-library"]], "Intel Advanced Feature and Extension Management": [[23, "intel-advanced-feature-and-extension-management"]], "Intel CPU Software Installation": [[41, "intel-cpu-software-installation"]], "Intel GPU Driver": [[46, "intel-gpu-driver"]], "Intel OpenMP": [[32, "intel-openmp"]], "Intel XPU Software Installation": [[42, "intel-xpu-software-installation"]], "Intel\u00ae DevCloud": [[45, "intel-devcloud"], [52, "intel-devcloud"]], "Intel\u00ae Extension for TensorFlow*": [[63, "intel-extension-for-tensorflow"]], "Intel\u00ae Extension for TensorFlow* Config Protocol": [[33, "intel-extension-for-tensorflow-config-protocol"]], "Intel\u00ae Extension for TensorFlow* Docker Container Guide": [[2, "intel-extension-for-tensorflow-docker-container-guide"]], "Intel\u00ae Extension for TensorFlow* Serving - Docker Container Guide": [[3, "intel-extension-for-tensorflow-serving-docker-container-guide"]], "Intel\u00ae Extension for TensorFlow* for C++": [[40, "intel-extension-for-tensorflow-for-c"]], "Intel\u00ae Extension for Tensorflow* Model Quantization API Example": [[49, "intel-extension-for-tensorflow-model-quantization-api-example"]], "Intel\u00ae Extension for Tensorflow* Version": [[52, "intel-extension-for-tensorflow-version"]], "Intel\u00ae oneAPI Base Toolkit": [[46, "intel-oneapi-base-toolkit"]], "Introduction": [[5, "introduction"], [13, "introduction"], [23, "introduction"], [45, "introduction"], [47, "introduction"], [50, "introduction"], [51, "introduction"], [52, "introduction"], [54, "introduction"], [55, "introduction"], [56, "introduction"], [57, "introduction"], [60, "introduction"], [61, "introduction"], [62, "introduction"]], "Jemalloc": [[29, "jemalloc"]], "Keras 3 Overview": [[27, "keras-3-overview"]], "Keras Mixed Precision": [[28, "keras-mixed-precision"]], "Known Issues": [[8, "known-issues"]], "LSTM": [[26, "lstm"]], "Latency mode": [[29, "latency-mode"]], "Launch Log": [[29, "launch-log"]], "Launch Script User Guide": [[29, "launch-script-user-guide"]], "Layer Normalization": [[26, "layer-normalization"]], "License": [[52, "license"], [63, "license"]], "Limitation": [[36, "limitation"]], "Linker": [[40, "linker"]], "Load": [[40, "load"]], "Local Server": [[45, "local-server"], [52, "local-server"]], "Log and Save Optimized Graph": [[19, "log-and-save-optimized-graph"]], "Loss scaling": [[28, "loss-scaling"]], "Loss scaling overview": [[28, "loss-scaling-overview"]], "Mask-RCNN Inference Performance Results": [[31, "mask-rcnn-inference-performance-results"]], "Mask-RCNN Training Performance Results": [[31, "mask-rcnn-training-performance-results"]], "Medical Image 3D U-Net Training Performance Results": [[31, "medical-image-3d-u-net-training-performance-results"]], "Memory Allocator": [[29, "memory-allocator"], [32, "memory-allocator"]], "Memory Layout format": [[32, "memory-layout-format"]], "Mixed data type fusion": [[24, "mixed-data-type-fusion"]], "Model Code change": [[51, "model-code-change"], [54, "model-code-change"], [55, "model-code-change"], [57, "model-code-change"], [60, "model-code-change"], [61, "model-code-change"]], "Models": [[31, "models"]], "Multi-instance": [[29, "multi-instance"]], "Multi-tile with horovod": [[55, "multi-tile-with-horovod"]], "Multiple instances for inference": [[29, "multiple-instances-for-inference"]], "NUMA Control": [[29, "numa-control"]], "Native Linux Running Directly on Hardware": [[37, "native-linux-running-directly-on-hardware"], [37, "id2"]], "NextPluggableDevice Architecture": [[30, "nextpluggabledevice-architecture"]], "NextPluggableDevice Overview": [[30, "nextpluggabledevice-overview"]], "Non-Uniform Memory Access (NUMA)": [[32, "non-uniform-memory-access-numa"]], "Notes": [[53, "notes"]], "Notice": [[19, "notice"]], "Numactl": [[32, "numactl"]], "Numeric Stability": [[18, "numeric-stability"]], "OMP_NUM_THREADS": [[32, "omp-num-threads"]], "Objectives": [[16, "objectives"]], "Online Documentation Build Guide": [[5, "online-documentation-build-guide"]], "Online Weight Prepack": [[36, "online-weight-prepack"]], "OpenMP": [[32, "openmp"]], "OpenXLA": [[16, "openxla"]], "OpenXLA PJRT Plugin": [[30, "openxla-pjrt-plugin"]], "OpenXLA Support on GPU [Experimental]": [[21, "openxla-support-on-gpu-experimental"]], "Operator Optimization": [[21, "operator-optimization"]], "Operators Override": [[26, "operators-override"]], "Optimization in convolution": [[13, "optimization-in-convolution"]], "Optimizations Design": [[12, "optimizations-design"]], "Option 1: Extract from Tensorflow* python package (Recommended)": [[40, "option-1-extract-from-tensorflow-python-package-recommended"]], "Option 2: Build from TensorFlow* source code": [[40, "option-2-build-from-tensorflow-source-code"]], "Optional Requirements for CPU Build Only": [[39, "optional-requirements-for-cpu-build-only"]], "Optional: Install Full Intel\u00ae oneAPI": [[37, "optional-install-full-intel-oneapi"]], "Original Code": [[19, "original-code"]], "Our Pledge": [[0, "our-pledge"]], "Our Standards": [[0, "our-standards"]], "Output": [[58, "output"]], "Overview": [[15, "overview"], [16, "overview"], [17, "overview"], [19, "overview"], [20, "overview"], [28, "overview"], [29, "overview"], [31, "overview"], [32, "overview"], [33, "overview"], [36, "overview"], [39, "overview"], [49, "overview"]], "Performance Data": [[31, "performance-data"]], "Practice Guide": [[32, "practice-guide"]], "Preconditions": [[38, "preconditions"]], "Prepare": [[46, "prepare"]], "Prepare Dataset": [[49, "prepare-dataset"], [51, "prepare-dataset"], [55, "prepare-dataset"], [60, "prepare-dataset"]], "Prepare Example Code": [[58, "prepare-example-code"]], "Prepare ImageNet dataset": [[61, "prepare-imagenet-dataset"]], "Prepare Pre-Trained Model": [[49, "prepare-pre-trained-model"]], "Prepare Tensorflow* CC library and header files": [[40, "prepare-tensorflow-cc-library-and-header-files"]], "Prepare for GPU": [[51, "prepare-for-gpu"], [55, "prepare-for-gpu"], [57, "prepare-for-gpu"], [60, "prepare-for-gpu"], [62, "prepare-for-gpu"]], "Prepare for GPU (Skip this Step for CPU)": [[47, "prepare-for-gpu-skip-this-step-for-cpu"]], "Prepare for GPU (Skip this step for CPU)": [[48, "prepare-for-gpu-skip-this-step-for-cpu"], [54, "prepare-for-gpu-skip-this-step-for-cpu"], [56, "prepare-for-gpu-skip-this-step-for-cpu"], [61, "prepare-for-gpu-skip-this-step-for-cpu"]], "Prepare for Running": [[44, "prepare-for-running"]], "Prepare the Codes": [[62, "prepare-the-codes"]], "Prerequisite: import intel_extension_for_tensorflow as itex": [[33, "prerequisite-import-intel-extension-for-tensorflow-as-itex"]], "Prerequisites": [[48, "prerequisites"], [51, "prerequisites"], [51, "id1"], [51, "id2"], [54, "prerequisites"], [55, "prerequisites"], [56, "prerequisites"], [57, "prerequisites"], [60, "prerequisites"], [61, "prerequisites"], [62, "prerequisites"]], "Pretraining Command": [[51, "pretraining-command"]], "Python API": [[17, "python-api"], [18, "python-api"], [47, "python-api"], [62, "python-api"]], "Python API Attribute & Environment Variable": [[18, "python-api-attribute-environment-variable"]], "Python APIs": [[33, "python-apis"]], "Python APIs and Environment Variable Names": [[33, "python-apis-and-environment-variable-names"]], "Python APIs and preserved environment variable Names": [[33, "python-apis-and-preserved-environment-variable-names"]], "Python Unit Testing": [[7, "python-unit-testing"]], "Python coding style": [[7, "python-coding-style"]], "Quantize Inception V3 by Intel\u00ae Extension for Tensorflow* on Intel\u00ae Xeon\u00ae": [[52, "quantize-inception-v3-by-intel-extension-for-tensorflow-on-intel-xeon"]], "Quick Example on Intel CPU and GPU": [[53, "quick-example-on-intel-cpu-and-gpu"]], "Quick Start Guide": [[50, "quick-start-guide"]], "Quick Training Example": [[19, "quick-training-example"]], "Refer to train_resnet50": [[59, "refer-to-train-resnet50"]], "Reference": [[36, "reference"]], "References": [[16, "references"]], "Releases": [[8, "releases"]], "Report a Vulnerability": [[1, "report-a-vulnerability"]], "Requirements": [[39, "requirements"], [40, "requirements"]], "ResNet50 Inference on Intel CPU and GPU": [[48, "resnet50-inference-on-intel-cpu-and-gpu"]], "ResNet50v1-5 Inference Performance Results": [[31, "resnet50v1-5-inference-performance-results"]], "ResNet50v1-5 Training Performance Results": [[31, "resnet50v1-5-training-performance-results"]], "Resnet50 train on Intel GPU": [[61, "resnet50-train-on-intel-gpu"]], "Resources": [[10, "resources"], [63, "resources"]], "Result": [[47, "result"]], "Results": [[51, "results"]], "Rule to Improve Performance by the Configuration List": [[18, "rule-to-improve-performance-by-the-configuration-list"]], "Run Model Quantization Example:": [[49, "run-model-quantization-example"]], "Run Models in the Docker Container": [[50, "run-models-in-the-docker-container"]], "Run Models on Bare Metal": [[50, "run-models-on-bare-metal"]], "Run Script": [[46, "run-script"]], "Run sample": [[34, "run-sample"]], "Running": [[46, "running"]], "Running Command": [[58, "running-command"]], "Running Environment": [[45, "running-environment"], [52, "running-environment"]], "Running the Container": [[3, "running-the-container"]], "Running the Jupyter Notebook": [[54, "running-the-jupyter-notebook"]], "Runtime": [[14, "runtime"]], "Runtime Switch of NextPluggableDevice and PluggableDevice": [[30, "runtime-switch-of-nextpluggabledevice-and-pluggabledevice"]], "Scope": [[0, "scope"]], "Security": [[63, "security"]], "Security Policy": [[1, "security-policy"]], "Selecting Thread Pool in Intel\u00ae Extension for TensorFlow* CPU [Experimental]": [[35, "selecting-thread-pool-in-intel-extension-for-tensorflow-cpu-experimental"]], "Set Model Parameters": [[61, "set-model-parameters"]], "Set Up Software Environment": [[49, "set-up-software-environment"]], "Set environment variables for inference": [[29, "set-environment-variables-for-inference"]], "Set up Base Running Environment": [[45, "set-up-base-running-environment"]], "Set up Intel\u00ae Extension for Tensorflow* for GPU": [[45, "set-up-intel-extension-for-tensorflow-for-gpu"]], "Setting the dtype policy": [[28, "setting-the-dtype-policy"]], "Setup": [[19, "setup"], [28, "setup"]], "Setup PYTHONPATH": [[62, "setup-pythonpath"]], "Setup Running Environment": [[46, "setup-running-environment"], [47, "setup-running-environment"], [48, "setup-running-environment"], [51, "setup-running-environment"], [54, "setup-running-environment"], [55, "setup-running-environment"], [56, "setup-running-environment"], [57, "setup-running-environment"], [58, "setup-running-environment"], [60, "setup-running-environment"], [61, "setup-running-environment"]], "Setup environment variables": [[37, "setup-environment-variables"], [42, "setup-environment-variables"]], "Sharding Parameters Setting": [[62, "sharding-parameters-setting"]], "Single Tile": [[55, "single-tile"]], "Single instance for inference": [[29, "single-instance-for-inference"]], "Situations leads to warning or Error": [[27, "situations-leads-to-warning-or-error"]], "Software Configuration": [[31, "software-configuration"], [32, "software-configuration"]], "Software Configuration for Intel Flex 170 GPU": [[31, "software-configuration-for-intel-flex-170-gpu"]], "Software Configuration for Intel Max 1550 GPU": [[31, "software-configuration-for-intel-max-1550-gpu"]], "Software Requirement": [[63, "software-requirement"]], "Software Requirements": [[37, "software-requirements"], [41, "software-requirements"], [42, "software-requirements"]], "Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal": [[47, "speed-up-inference-of-inception-v4-by-advanced-automatic-mixed-precision-on-intel-cpu-and-gpu-via-docker-container-or-bare-metal"]], "Stable Diffusion Inference for Text2Image on Intel GPU": [[54, "stable-diffusion-inference-for-text2image-on-intel-gpu"]], "Stable Diffusion v1-4 Inference Performance Results": [[31, "stable-diffusion-v1-4-inference-performance-results"]], "Start with XLA using NextPluggableDevice": [[30, "start-with-xla-using-nextpluggabledevice"]], "Startup Jupyter Notebook": [[52, "startup-jupyter-notebook"], [56, "startup-jupyter-notebook"]], "Step": [[47, "step"]], "Step by step instructions:": [[38, "step-by-step-instructions"]], "Step-By-Step Instructions": [[37, "step-by-step-instructions"]], "Support": [[63, "support"]], "System environment install": [[37, "system-environment-install"], [41, "system-environment-install"], [42, "system-environment-install"]], "TCMalloc": [[29, "tcmalloc"], [32, "tcmalloc"]], "Table of Contents": [[32, "table-of-contents"]], "TensorFlow Public API": [[23, "tensorflow-public-api"]], "TensorFlow Serving": [[21, "tensorflow-serving"]], "Throughput mode": [[29, "throughput-mode"]], "Tips": [[19, "tips"]], "Tips and Debugging": [[7, "tips-and-debugging"]], "Training Accuracy Results": [[31, "training-accuracy-results"]], "Training Accuracy on 1-node of 4x Intel Data Center GPU Max 1550": [[31, "training-accuracy-on-1-node-of-4x-intel-data-center-gpu-max-1550"]], "Training Performance Results": [[31, "training-performance-results"]], "Training Performance on 1-node of 4x Intel Data Center GPU Max 1550": [[31, "training-performance-on-1-node-of-4x-intel-data-center-gpu-max-1550"]], "Training Workloads": [[31, "training-workloads"]], "Training the model with Model.fit": [[28, "training-the-model-with-model-fit"]], "Training the model with a custom training loop": [[28, "training-the-model-with-a-custom-training-loop"]], "Troubleshooting": [[14, "troubleshooting"]], "Tune Advanced AMP Manually": [[19, "tune-advanced-amp-manually"]], "Tune Advanced Auto Mixed Precision": [[18, "tune-advanced-auto-mixed-precision"]], "Tuning Performance Example on MobileNet": [[18, "tuning-performance-example-on-mobilenet"]], "Ubuntu Linux Installed in WSL2": [[37, "ubuntu-linux-installed-in-wsl2"]], "Underflow and Overflow": [[28, "underflow-and-overflow"]], "Unit testing": [[7, "unit-testing"]], "Update latest Version": [[5, "update-latest-version"]], "Usage": [[15, "usage"], [17, "usage"], [18, "usage"], [18, "id1"], [19, "usage"], [22, "usage"], [26, "usage"]], "Usage & Effect": [[36, "usage-effect"]], "Usage of Docker Container": [[2, "usage-of-docker-container"]], "Usage of TCMalloc/Jemalloc/Default memory allocator": [[29, "usage-of-tcmalloc-jemalloc-default-memory-allocator"]], "Use Case with different performance": [[27, "use-case-with-different-performance"]], "Using Eigen Thread Pool": [[35, "using-eigen-thread-pool"]], "Using OpenMP Thread Pool": [[35, "using-openmp-thread-pool"]], "V. Throughput mode": [[29, "v-throughput-mode"]], "VI. Latency mode": [[29, "vi-latency-mode"]], "VII. Your designated number of instances": [[29, "vii-your-designated-number-of-instances"]], "VIII. Your designated number of instances and instance index": [[29, "viii-your-designated-number-of-instances-and-instance-index"]], "Verify That Intel GPU is Accessible From TensorFlow": [[2, "verify-that-intel-gpu-is-accessible-from-tensorflow"]], "Verify the Installation": [[41, "verify-the-installation"], [42, "verify-the-installation"]], "Virtual environment install": [[37, "virtual-environment-install"], [41, "virtual-environment-install"], [42, "virtual-environment-install"]], "Welcome to Intel \u00ae Extension for TensorFlow* documentation!": [[6, "welcome-to-intel-extension-for-tensorflow-documentation"], [64, "welcome-to-intel-extension-for-tensorflow-documentation"]], "Welcome to Intel\u00ae Extension for TensorFlow* documentation": [[4, "welcome-to-intel-extension-for-tensorflow-documentation"]], "Why NextPluggableDevice": [[30, "why-nextpluggabledevice"]], "Windows GPU Drivers": [[37, "windows-gpu-drivers"]], "Windows Subsystem for Linux 2 (WSL2)": [[37, "windows-subsystem-for-linux-2-wsl2"], [37, "id1"]], "With XPUAutoShard": [[62, "with-xpuautoshard"]], "Without XPUAutoShard": [[62, "without-xpuautoshard"]], "Workflow": [[10, "workflow"], [15, "workflow"], [17, "workflow"], [36, "workflow"]], "X. Set environment variable TF_NUM_INTEROP_THREADS": [[29, "x-set-environment-variable-tf-num-interop-threads"]], "XPU Engine": [[23, "xpu-engine"]], "XPU for CPU only platform (Deprecated)": [[42, "xpu-for-cpu-only-platform-deprecated"]], "XPUAutoShard on GPU [Experimental]": [[17, "xpuautoshard-on-gpu-experimental"], [21, "xpuautoshard-on-gpu-experimental"]], "bazel style guide": [[7, "bazel-style-guide"]], "itex graph": [[33, "itex-graph"]], "itex operators": [[33, "itex-operators"]], "itex ops override": [[33, "itex-ops-override"]], "itex version": [[33, "itex-version"]], "itex.AutoMixedPrecisionOptions": [[33, "itex-automixedprecisionoptions"]], "itex.ConfigProto": [[33, "itex-configproto"]], "itex.DebugOptions": [[33, "itex-debugoptions"]], "itex.GPUOptions": [[33, "itex-gpuoptions"]], "itex.GraphOptions": [[33, "itex-graphoptions"]], "itex.ShardingConfig": [[33, "itex-shardingconfig"]], "itex.get_config": [[33, "itex-get-config"]], "itex.ops.AdamWithWeightDecayOptimizer": [[25, "itex-ops-adamwithweightdecayoptimizer"]], "itex.ops.GroupNormalization": [[25, "itex-ops-groupnormalization"]], "itex.ops.ItexLSTM": [[25, "itex-ops-itexlstm"]], "itex.ops.LAMBOptimizer": [[25, "itex-ops-lamboptimizer"]], "itex.ops.LayerNormalization": [[25, "itex-ops-layernormalization"]], "itex.ops.gelu": [[25, "itex-ops-gelu"]], "itex.set_config": [[33, "itex-set-config"]], "oneDNN object cache optimization": [[13, "onednn-object-cache-optimization"]], "quick_example.py": [[53, "quick-example-py"]]}, "docnames": ["CODE_OF_CONDUCT", "SECURITY", "docker/README", "docker/tensorflow-serving/README", "docs/README", "docs/build_docs/docs_build_tips", "docs/build_docs/source/index", "docs/community/contributing", "docs/community/releases", "docs/design/directory_structure", "docs/design/extension_design", "docs/design/how_to_write_custom_op", "docs/design/optimization/README", "docs/design/optimization/oneDNN_object_cache", "docs/guide/FAQ", "docs/guide/INT8_quantization", "docs/guide/OpenXLA", "docs/guide/XPUAutoShard", "docs/guide/aamp_tune", "docs/guide/advanced_auto_mixed_precision", "docs/guide/environment_variables", "docs/guide/features", "docs/guide/how_to_enable_profiler", "docs/guide/infrastructure", "docs/guide/itex_fusion", "docs/guide/itex_ops", "docs/guide/itex_ops_override", "docs/guide/keras3_support", "docs/guide/keras_mixed_precision", "docs/guide/launch", "docs/guide/next_pluggable_device", "docs/guide/performance", "docs/guide/practice_guide", "docs/guide/python_api", "docs/guide/tf_serving_install", "docs/guide/threadpool", "docs/guide/weight_prepack", "docs/install/experimental/install_for_arc_gpu", "docs/install/experimental/install_for_gpu_conda", "docs/install/how_to_build", "docs/install/install_for_cpp", "docs/install/install_for_cpu", "docs/install/install_for_xpu", "docs/install/installation_guide", "examples/README", "examples/accelerate_alexnet_by_quantization/README", "examples/common_guide_running", "examples/infer_inception_v4_amp/README", "examples/infer_resnet50/README", "examples/itex_quantization_example/README", "examples/model_zoo_example/README", "examples/pretrain_bert/README", "examples/quantize_inception_v3/README", "examples/quick_example", "examples/stable_diffussion_inference/README", "examples/train_3d_unet/README", "examples/train_bert/README", "examples/train_bert_fp8/README", "examples/train_horovod/mnist/README", "examples/train_horovod/resnet50/README", "examples/train_maskrcnn/README", "examples/train_resnet50/README", "examples/train_resnet50_with_autoshard/README", "get_started", "index"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["CODE_OF_CONDUCT.md", "SECURITY.md", "docker/README.md", "docker/tensorflow-serving/README.md", "docs/README.md", "docs/build_docs/docs_build_tips.md", "docs/build_docs/source/index.rst", "docs/community/contributing.md", "docs/community/releases.md", "docs/design/directory_structure.md", "docs/design/extension_design.md", "docs/design/how_to_write_custom_op.md", "docs/design/optimization/README.md", "docs/design/optimization/oneDNN_object_cache.md", "docs/guide/FAQ.md", "docs/guide/INT8_quantization.md", "docs/guide/OpenXLA.md", "docs/guide/XPUAutoShard.md", "docs/guide/aamp_tune.md", "docs/guide/advanced_auto_mixed_precision.md", "docs/guide/environment_variables.md", "docs/guide/features.rst", "docs/guide/how_to_enable_profiler.md", "docs/guide/infrastructure.md", "docs/guide/itex_fusion.md", "docs/guide/itex_ops.md", "docs/guide/itex_ops_override.md", "docs/guide/keras3_support.md", "docs/guide/keras_mixed_precision.md", "docs/guide/launch.md", "docs/guide/next_pluggable_device.md", "docs/guide/performance.md", "docs/guide/practice_guide.md", "docs/guide/python_api.md", "docs/guide/tf_serving_install.md", "docs/guide/threadpool.md", "docs/guide/weight_prepack.md", "docs/install/experimental/install_for_arc_gpu.md", "docs/install/experimental/install_for_gpu_conda.md", "docs/install/how_to_build.md", "docs/install/install_for_cpp.md", "docs/install/install_for_cpu.md", "docs/install/install_for_xpu.md", "docs/install/installation_guide.rst", "examples/README.md", "examples/accelerate_alexnet_by_quantization/README.md", "examples/common_guide_running.md", "examples/infer_inception_v4_amp/README.md", "examples/infer_resnet50/README.md", "examples/itex_quantization_example/README.md", "examples/model_zoo_example/README.md", "examples/pretrain_bert/README.md", "examples/quantize_inception_v3/README.md", "examples/quick_example.md", "examples/stable_diffussion_inference/README.md", "examples/train_3d_unet/README.md", "examples/train_bert/README.md", "examples/train_bert_fp8/README.md", "examples/train_horovod/mnist/README.md", "examples/train_horovod/resnet50/README.md", "examples/train_maskrcnn/README.md", "examples/train_resnet50/README.md", "examples/train_resnet50_with_autoshard/README.md", "get_started.md", "index.rst"], "indexentries": {}, "objects": {}, "objnames": {}, "objtypes": {}, "terms": {"": [0, 4, 5, 14, 16, 18, 20, 21, 28, 31, 32, 34, 35, 39, 40, 45, 47, 49, 51, 52, 54, 55, 56, 63], "0": [2, 3, 4, 5, 11, 14, 15, 16, 19, 20, 22, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 45, 48, 49, 51, 52, 53, 56, 57, 58, 60, 61, 62, 63], "00": [16, 31, 42, 49, 61], "000": 28, "000000e": 51, "0001": 49, "0005": 51, "000611": 51, "001": [25, 26], "00363725": 25, "004": 51, "00404969": 25, "004888": 51, "006297": 61, "006950": 58, "00x": 31, "01": [14, 16, 26, 31, 33, 49, 61], "0113076031208038": 47, "01837550401687622": 47, "02": [16, 26, 28, 31, 61], "025180": 62, "027671": 62, "03": [29, 31, 51, 61], "037595": 51, "04": [2, 16, 31, 34, 35, 37, 39, 41, 42, 49, 56], "05": [16, 29, 31, 58], "0527704": 53, "06": [14, 16, 25, 28, 51], "061277": 28, "061301": 28, "061306": 28, "063685": 28, "063851": 28, "063865": 28, "0656753": 53, "07": [14, 16, 25, 31, 42, 61, 62], "072701": 51, "072752": 51, "072779": 51, "072805": 51, "072829": 51, "072861": 51, "072884": 51, "072928": 51, "073072": 51, "073094": 51, "073121": 51, "073183": 51, "077278": 53, "08": [16, 29, 35, 61], "089": 29, "09": [16, 29, 61], "090": 29, "0f": 11, "1": [2, 4, 5, 14, 16, 18, 19, 20, 21, 22, 25, 26, 27, 28, 29, 30, 32, 33, 35, 36, 38, 39, 42, 47, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "10": [2, 14, 16, 18, 19, 25, 28, 29, 35, 36, 37, 39, 40, 41, 49, 51, 52, 61, 62, 63], "100": [11, 28, 33, 39, 51], "1000": [31, 34, 55, 61], "10000": [19, 25, 28], "101": 37, "1024": [28, 31], "1024_a": 51, "1024gb": 31, "103148": 62, "105446": 51, "107809": 58, "10gbase": 31, "11": [16, 18, 29, 31, 37, 38, 39, 40, 42, 61, 63], "111": [28, 32], "112": 32, "114": [28, 58], "1146879196167": 54, "11490434": 28, "116": 14, "118": [28, 30], "118212": 53, "1193419": 53, "12": [7, 14, 16, 28, 29, 31, 42, 51, 54, 56, 58, 61, 62, 63], "1200": 61, "122": 33, "122414": 51, "122509": 51, "12278": 31, "127": [5, 34], "128": [16, 31, 47, 51, 57], "128gb": 31, "129": 29, "12_h": 51, "12e": 51, "13": [16, 40, 52, 58, 62, 63], "133": 49, "136": 29, "137": 29, "139660941027136": 61, "139898862851904": 61, "14": [28, 31, 34, 40, 49, 51, 56, 58, 61, 63], "140": [39, 40], "140348344015936": 62, "1403804": 53, "140612319840064": 61, "141": 11, "144": 29, "1445": 11, "145": [29, 61, 62], "1455178": 53, "15": [2, 7, 16, 29, 31, 35, 37, 38, 39, 40, 41, 42, 45, 51, 63], "150": 55, "15000": 25, "15031084974591766410": 2, "150400": 31, "150w": 31, "1550": 16, "156": 28, "15865526": 25, "158808": 25, "16": [18, 28, 29, 31, 33, 41, 47, 51, 61], "161625": 62, "163": 49, "163161": 58, "163517": 58, "163815": 62, "1657011814330": 18, "1657011815538": 18, "1658201": 53, "1666": 51, "1691980294577": 47, "16x64gb": 31, "17": [29, 40], "170": [39, 40, 42, 54, 57], "1704025": 53, "170intel": 47, "1729176": 53, "174": 56, "17448926295332318308": 2, "1762": 31, "1766": 31, "177216": 51, "178206": 61, "18": [16, 51, 58], "182": 31, "1846": 51, "185w": 31, "19": [29, 31, 37, 41, 42], "1900": 61, "190052": 51, "190136": 51, "190169": 51, "190193": 51, "190217": 51, "190249": 51, "190273": 51, "190343": 51, "190536": 51, "190559": 51, "190587": 51, "190668": 51, "191": 29, "192": [29, 51], "197306": 53, "198": 29, "1986": 28, "1997": 25, "1a": 40, "1ccb4fee": 38, "1e": [25, 26, 28], "1export": [18, 19], "1tb": 31, "1u": 28, "2": [2, 14, 15, 16, 17, 18, 19, 20, 24, 25, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 41, 42, 45, 47, 48, 49, 51, 52, 53, 54, 55, 57, 58, 60, 61, 62, 63], "20": [16, 29, 31, 35, 39, 41, 60, 62], "200": [25, 26, 51], "2000": [51, 61], "200m": 32, "2016": 25, "2017": [31, 60], "2018": 49, "20180905": 33, "2019": 55, "20200711": 49, "2021": 14, "2022": [28, 29, 33], "2023": [38, 42, 49, 51, 58], "20230123": 21, "2024": [14, 31, 37, 42], "206": 29, "207": 29, "21": [29, 31, 51], "210": 49, "2100": 61, "2134862": 53, "215": 29, "2155": 28, "216": 29, "217981": 42, "22": [2, 31, 34, 37, 39, 41, 42, 49, 51, 62], "2200": 61, "22355853": 48, "224": [22, 49], "22471978829632": 51, "224x224": 31, "227250": 51, "229": 29, "23": [29, 31, 42, 62], "2300": 61, "23092487755584": 51, "23450678511424": 51, "2350": 37, "24": [29, 31, 51, 58], "2400": 61, "241": 29, "2488174077578": 57, "24_h": 51, "24x": 31, "25": [31, 62], "250": 58, "250221": 53, "25294047594070435": 28, "254": 29, "255": [19, 28, 35], "256": [28, 31, 35, 51, 62], "26": 35, "2600": 51, "2607155": 53, "2636094": 53, "26531240344047546": 28, "266": 29, "268435456": 2, "269": 28, "27": [16, 29, 32, 62], "272": 30, "27642": 42, "277716": 61, "277811": 61, "278": 29, "28": [29, 31, 32, 38, 42, 49, 51], "280": 62, "29": [29, 31], "290": 29, "298973": 53, "299": 35, "2nd": 41, "2tb": 31, "2x": [31, 35], "2x256x10": 62, "3": [2, 4, 7, 16, 18, 20, 22, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 38, 39, 40, 41, 42, 45, 46, 49, 52, 53, 62], "30": [14, 16, 31, 35, 49, 51, 62], "3000765": 53, "3007": 31, "300x300": [31, 49], "302": 29, "303": 28, "305706": 53, "31": [29, 37], "312": [31, 51], "314010": 51, "314064": 51, "314090": 51, "314113": 51, "314135": 51, "314165": 51, "314197": 51, "314260": 51, "314455": 51, "314478": 51, "314505": 51, "314589": 51, "315": 29, "318963": 53, "32": [16, 18, 25, 26, 28, 29, 31, 33, 47, 51, 57, 61], "3200": 31, "3221133": 53, "3265": 31, "327": 29, "327398": 53, "328223477737884": 54, "33": 14, "3343554": 62, "3359": 28, "3359284": 62, "3364005982875824": 28, "339": 29, "3391027": 53, "34": 29, "3455": 28, "3461": 31, "35": [29, 31, 42], "350w": 31, "351": 29, "3549364": 53, "3555": 28, "3587": 31, "36": [29, 31, 35, 49], "364": 29, "3670": 28, "37": 16, "3753": 28, "376": 29, "3787665": 53, "38": [29, 31], "3804817": 53, "381424": 53, "384": 31, "3870": 31, "388": 29, "39": [29, 31], "3905785": 53, "3999124": 53, "3d": 44, "3dunet_itex": 55, "3dunet_itex_with_horovod": 55, "3e": [51, 57], "3f": 35, "3rd": [4, 21, 31, 41], "4": [14, 17, 18, 20, 24, 25, 28, 29, 30, 32, 35, 38, 51, 53, 58, 60, 62], "40": [14, 16, 29, 31, 42, 51], "400": [29, 61], "404": 29, "405": 29, "408512": 61, "4096": [19, 28], "40ghz": 31, "41": [16, 28], "41249612335034": 57, "413": 29, "416651": 62, "419072": 62, "42": 31, "42261": 53, "425": 29, "43": [16, 29, 31, 42], "435": 31, "438": 29, "44": [11, 16, 29], "4498": 28, "452": 29, "45x": 31, "461180928": 51, "465": 29, "47": [16, 29, 61], "4718971": 53, "479": 62, "479142": 53, "47eb": [37, 42], "48": [16, 29, 51, 61], "480": 29, "4800": 31, "481086": 53, "4818356": 53, "49": [29, 61], "4929404": 53, "494": 29, "4d": 25, "4th": [31, 41, 47], "5": [11, 18, 19, 20, 22, 25, 28, 30, 33, 35, 39, 40, 41, 51, 53, 57, 62], "50": [29, 31, 35], "5000": 31, "5063303": 53, "509": 29, "50ghz": 32, "51": [16, 29, 31, 51], "510076": 14, "51179520": 51, "512": [31, 51, 57], "5120": 62, "512x512": 31, "517385": 53, "52": [16, 28, 29, 51], "523": 31, "5294489860534668": 28, "53": [29, 31], "5300783": 53, "5333": 37, "54": 58, "5479512": 53, "549": 29, "55": [14, 16, 29, 31, 32, 35, 62], "550": 29, "555174": 61, "555221": 61, "5597944": 53, "56": [16, 29, 31, 32, 35], "57": 31, "5774": 51, "57x": 31, "58": 29, "586": 29, "59": [16, 29], "590331": 61, "594147": 62, "595": 51, "596": [37, 42, 51], "597": 51, "597360": 62, "598": 51, "5e": 51, "5th": 31, "6": [18, 26, 28, 30, 31, 33, 42, 49, 51], "60": [28, 29, 31, 35, 51], "600": [51, 61], "60000": [19, 28], "600w": 31, "601": 51, "602": 51, "6027272": 53, "602742": 61, "603262": 61, "604": [29, 51], "6047": 31, "605": 29, "606": 51, "607": 51, "6153628825864496": 47, "6240": 28, "63": [16, 29], "6336y": 31, "6342418": 53, "634554": 62, "64": [14, 16, 17, 19, 28, 29, 31, 35, 37, 39, 41, 42, 51, 56], "640x640": 49, "6416": 51, "6422923": 53, "6456823": 53, "6461415": 53, "6514435": 53, "65504": 28, "6628485": 53, "66fa74b6a2a0bb1e563ae8bce66496b118b95200": 54, "67": [16, 29, 31], "6761076": 53, "68": 29, "6867": 31, "69": 31, "692": 31, "6926193": 53, "693": 29, "694": 29, "69612": 49, "699": 31, "7": [18, 28, 29, 30, 31, 33, 49, 51, 54], "7090344": 53, "71": 29, "7112d33": 33, "718459": 53, "72": [29, 49], "7239000201225281": 28, "7296917": 53, "7297122": 53, "730m": 14, "736": 31, "74": 31, "7494": 28, "75": [29, 31], "7520": 28, "757": 29, "76": [25, 29, 31, 51], "768": 51, "768_a": 51, "772": 29, "773": 11, "7787259": 53, "784": [19, 28, 29, 35], "79": 29, "790128": 61, "790632": 62, "792936": 62, "795": 29, "7987": 28, "7f": 51, "8": [18, 25, 28, 29, 31, 33, 40, 41, 42, 49, 51, 52], "80": [29, 31], "800": 61, "803": [37, 42], "806": 29, "81": [31, 51, 54, 57], "810": 51, "817": 29, "8180m": 32, "8192": [19, 28], "81m": 28, "82574l": 31, "828": 29, "83": [29, 31, 32, 51], "839": 29, "83m": 28, "84": [29, 31, 32], "841192": 25, "8413447": 25, "8480": [31, 35], "84m": 28, "85": 35, "850": 29, "8500": [3, 34], "8501": 34, "8534": 28, "85485": 53, "8598063": 53, "85m": 28, "86": [16, 31], "8672705": 53, "867908472383153": 47, "87": [29, 31], "870": 31, "875052": 53, "8751": 28, "88": [29, 57], "8809638": 53, "8819": 28, "8863": 28, "8876": [37, 42], "888000e": 51, "8880196": 53, "8888": [41, 42, 47, 52, 54, 56], "88eb3cff2f03dad85035621d041e23a14345999": 55, "891": 29, "892": 29, "8941312": 53, "8972": 28, "89942324": 53, "8x16gb": 31, "9": [14, 18, 25, 26, 29, 30, 37, 38, 39, 41, 42, 45, 46, 56, 62], "9000": 5, "908": 29, "909": 29, "91": [29, 31], "911": 29, "9154005": 53, "9168000221252441": 28, "917546": 61, "917738": 61, "918": 31, "92": [29, 31], "924008369445801": 28, "9259825": 53, "9260886": 53, "9266936945121049176": 2, "928": 31, "92880015134813": 47, "92x": 31, "93": 31, "930": 29, "9349675": 53, "9373732": 53, "9377": 28, "9381000399589539": 28, "9381838": 53, "93901324": 53, "94": 16, "940695": 58, "9410": 28, "947": 29, "948": 29, "9486000537872314": 28, "949225": 53, "95": [29, 31], "951": 29, "9536000490188599": 28, "96": [29, 31, 40, 51], "9631021": 53, "9677248": 53, "968": 31, "96x": 31, "97": 16, "9702091": 53, "9746864": 53, "9755": 28, "98": 16, "9842": 31, "9873173": 53, "988714": 53, "99": 16, "9959502": 25, "9963627": 25, "999": [25, 26], "99998": 25, "A": [0, 5, 17, 18, 24, 28, 29, 32, 33, 34, 36, 42, 44, 47, 58], "And": [30, 37, 41, 42, 51], "As": [17, 24, 28, 29, 32], "At": [16, 17, 21, 45, 54], "Being": 0, "But": [27, 28], "By": [13, 20, 28, 29, 32, 52], "For": [0, 1, 2, 4, 7, 11, 14, 15, 18, 19, 20, 23, 25, 26, 28, 29, 31, 33, 34, 35, 37, 42, 47, 48, 49, 50, 51, 54, 55, 56, 57, 58, 60, 61, 62], "If": [2, 3, 5, 20, 22, 25, 26, 27, 28, 29, 32, 33, 35, 37, 39, 40, 41, 42, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 60], "In": [4, 11, 16, 18, 19, 27, 28, 29, 30, 32, 35, 36, 38, 45, 47, 49, 52, 53, 58, 62], "It": [4, 11, 14, 15, 16, 17, 18, 19, 20, 21, 28, 30, 32, 35, 36, 38, 39, 44, 51, 52, 55, 56, 60, 63], "NOT": [7, 14], "No": [0, 14, 19, 22, 35, 39, 47, 48, 51, 54, 55, 56, 57, 60], "Not": 20, "ON": [17, 31, 33, 47, 62], "Of": 51, "On": [28, 32, 37, 41, 42], "One": [29, 32], "That": [14, 32, 39, 40, 47], "The": [0, 2, 4, 5, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 45, 47, 49, 51, 52, 55, 56, 57, 58, 60, 61, 62], "Their": 28, "Then": [3, 11, 22, 33, 41, 42, 52], "There": [21, 27, 36, 39, 45, 47, 52, 61], "These": [16, 24, 28, 29, 63], "To": [2, 3, 4, 7, 16, 18, 19, 24, 27, 28, 32, 36, 37, 39, 40, 41, 42, 45, 51, 52, 54, 55, 60], "With": [18, 19, 28, 29, 30, 45, 48, 53, 54], "_": [0, 11, 13, 14, 17, 18, 20, 22, 24, 27, 28, 29, 30, 32, 33, 34, 35, 37, 39, 40, 46, 47, 49, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61], "__del__": 56, "__init__": 35, "__main__": [29, 35], "__name__": 35, "__version__": [11, 33, 37, 39, 40, 41, 42, 63], "_gbs1_": 51, "_gbs2_": 51, "_pywrap_itex": 39, "_timestamp_inst": 29, "_timestamp_instance_n_cor": 29, "a100": 54, "a380": [39, 40], "a730m": [39, 40], "a930253": 33, "abl": 5, "about": [0, 7, 19, 32, 34, 35, 45, 51, 52, 58], "abov": [18, 19, 22, 28, 29, 32, 37, 47, 51, 52, 55, 56, 57, 58, 60, 62], "absolut": [29, 51], "abus": 0, "acceler": [4, 14, 16, 30, 31, 33, 44, 47, 52, 63], "accept": [0, 7, 17], "access": 37, "accmatmul": 24, "accord": [17, 18, 47, 56, 58, 61], "accordingli": 62, "account": 0, "accumul": 31, "accur": 36, "accuraci": [15, 18, 19, 25, 28, 44, 45, 52, 58, 61], "achiev": [18, 32], "acm": [39, 40], "across": [16, 20, 25], "act": [0, 21, 34], "action": [0, 5, 36], "activ": [11, 18, 19, 22, 25, 28, 32, 33, 37, 38, 39, 40, 41, 42, 46, 47, 48, 52, 53, 55, 56, 58, 60], "ad": [5, 13, 17, 18, 21, 23, 28, 39, 51, 62], "adam": 25, "adamw": 25, "adamwithweightdecayoptim": 26, "adapt": 0, "add": [3, 4, 5, 17, 18, 19, 24, 27, 32, 34, 37, 39, 40, 47, 54, 62], "add_weight": 35, "add_with_xla": 30, "addit": [8, 21, 23, 24, 32, 36, 40, 63], "addition": [18, 28], "addn": 24, "addon": [26, 58], "address": [0, 32, 37], "adher": 63, "adjust": [20, 25, 51], "adjusted_init_lr": 51, "adopt": [4, 15, 16, 21], "advanc": [0, 4, 20, 30, 33, 44, 63], "affect": [0, 18, 28], "affin": 32, "after": [2, 17, 18, 19, 22, 24, 26, 27, 28, 32, 33, 36, 37, 38, 42, 45, 51, 56], "afterward": [28, 29, 32], "ag": 0, "again": 28, "against": 7, "agent": 37, "aggress": [0, 16, 18, 19], "ahead": [39, 40], "ai": [44, 45, 50, 52, 63], "aim": 63, "aka": 21, "akdlm": [37, 42], "al": 25, "alexnet": 44, "alg": 11, "alg_kind_": 11, "algebra": [4, 16, 30], "algo": 11, "algorithm": [11, 25], "align": [0, 13], "all": [0, 7, 11, 14, 18, 20, 21, 25, 27, 28, 30, 32, 37, 42, 45, 47, 51, 62], "allocate_output": 11, "allow": [0, 16, 18, 28, 32, 35, 56, 63], "allowlist": 18, "allowlist_add": [18, 19], "allowlist_remov": 18, "almost": 21, "along": [30, 32], "alpha": 11, "alpha_": 11, "alreadi": [18, 28, 38, 45], "also": [0, 4, 7, 15, 16, 17, 19, 21, 23, 27, 28, 29, 30, 32, 36, 37, 38, 41, 42, 63], "altern": 18, "although": 32, "alwai": [18, 28, 36], "alwayslink": [11, 34], "am": 51, "among": [29, 32], "amount": [14, 28], "amp": [4, 18, 29, 31, 44, 55, 60, 63], "ampthre": 18, "amx": 52, "amx_bf16": 52, "amx_int8": 52, "an": [0, 2, 3, 4, 7, 11, 13, 14, 16, 18, 19, 21, 24, 25, 27, 28, 29, 30, 32, 34, 35, 37, 38, 39, 40, 42, 44, 49, 52, 53, 57, 62, 63], "anaconda": 38, "analysi": [16, 32], "analyt": 45, "analyz": [16, 22], "ani": [0, 4, 11, 16, 20, 21, 23, 24, 27, 28, 29, 37, 38, 39, 42, 45, 53, 56], "annot": 17, "anoth": [29, 32, 36], "answer": 0, "antirectifi": 35, "aot": [39, 40], "apach": 63, "api": [4, 7, 9, 10, 14, 15, 16, 19, 25, 26, 27, 28, 30, 32, 34, 40, 52, 53], "apolog": 0, "apologi": 0, "appear": [0, 28], "append": [35, 37, 41, 42], "appli": [0, 16, 17, 25, 28, 33, 34, 51, 54, 55, 57, 60, 62], "applic": [4, 21, 23, 31, 32, 33, 34, 36, 45], "apply_gradi": 28, "appoint": 0, "approach": [4, 16, 38], "appropri": [0, 3, 32, 39, 40], "approv": 7, "approxim": [11, 25], "approximate_": 11, "apt": [7, 34, 37, 39, 42], "ar": [0, 2, 4, 5, 7, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 34, 36, 37, 39, 40, 41, 42, 44, 45, 47, 51, 52, 53, 55, 58, 61, 63], "arang": 25, "arc": [14, 39, 40, 42, 47, 63], "arch": 37, "architectur": [11, 16], "archiv": 37, "area": 13, "arg": [2, 13, 33], "argument": [13, 25, 28, 29, 33], "around": [0, 29, 51], "arrai": 25, "articl": 32, "as_graph_el": 35, "ask": [4, 36, 39, 40], "aspect": 28, "assign": [29, 32, 40], "assign_i": 40, "assign_x": 40, "assist": 8, "assum": [17, 28, 32, 38, 39, 40, 51, 55, 60], "assumpt": [2, 3], "astyp": [19, 28, 35, 53], "ats": [39, 40], "atsp": 28, "attach": [2, 3, 28, 32], "attack": 0, "attent": [0, 20], "attr": [11, 20], "attribut": [24, 33], "auto": [4, 11, 17, 27, 29, 30, 33, 40], "auto_mixed_precis": [18, 19, 33, 47], "auto_mixed_precision_log_path": [20, 33], "auto_mixed_precision_opt": [18, 19, 47], "auto_mixed_precision_optionsgraph_opt": 18, "auto_mod": [17, 62], "auto_sharding_pass": 17, "auto_sharding_pass_mlir": 17, "autom": [21, 29], "automat": [4, 5, 16, 17, 18, 19, 21, 26, 28, 29, 31, 32, 33, 37, 42, 44, 48, 53, 62], "automixedprecis": 18, "automixedprecisionopt": [18, 19, 47], "automixedprecosionopt": 18, "autoshard": [17, 62], "ava": 49, "avail": [0, 2, 3, 11, 14, 19, 25, 29, 32, 35, 36, 39, 40, 41, 42, 55], "averag": 51, "avgpool": [18, 19, 49], "avgpool3d": [18, 19], "avoid": [0, 4, 24, 27, 28, 29, 32, 35, 38, 51], "avx512": [4, 21, 52], "avx_vnni": 52, "awk": 51, "axi": [25, 26, 35], "b": [30, 35, 40, 47, 49, 51, 52, 61, 62], "b4ab4b8f8b3a41fade4899fd00b5b2d2dad0981f3e1bb10df4c522975fd7": 40, "b7a8": [37, 42], "ba": 25, "back": [17, 28, 39], "backend": [4, 16, 21, 23, 26, 27, 28, 33, 42, 47, 48, 52, 53, 63], "background": 32, "background_thread": 29, "backward": [11, 28], "balanc": [18, 19, 31, 35], "bare": 44, "base": [7, 11, 14, 15, 16, 18, 19, 25, 31, 32, 37, 38, 41, 44, 47, 51, 52, 57, 58, 62, 63], "base_config": 35, "base_shap": 35, "basekit": [37, 38, 42], "bash": [2, 37, 38, 39, 40, 47, 51, 52, 60, 63], "bashrc": 38, "basi": 37, "basic": [18, 19, 20, 28], "batch": [17, 25, 28, 29, 31, 51, 62], "batch_siz": [16, 17, 19, 28, 35, 55, 62], "batch_size_per_gpu": 51, "batchmatmul": [24, 26], "bazel": [3, 11, 34], "bazelbuild": [7, 39, 40], "bazelrc": 39, "becaus": [18, 19, 28, 36], "becom": [13, 32, 36], "been": [28, 32, 54, 62], "befor": [5, 7, 11, 16, 18, 19, 24, 27, 28, 29, 32, 35, 36, 39, 40, 44, 62], "begin": [7, 11, 47], "behavior": [0, 27, 28, 29, 32, 36, 51], "being": 32, "below": [2, 3, 24, 25, 28, 29, 30, 31, 32, 33, 37, 39, 42, 51, 56], "benchmark": [7, 16, 31, 35, 55, 61], "benefit": [4, 21, 28, 32, 33], "bert": [16, 20, 25, 36, 44], "bert_base_dir": 16, "bert_base_model": 16, "bert_config": [16, 57], "bert_config_fil": [16, 57], "bert_larg": 16, "bert_large_dir": 57, "bert_model": [51, 57], "bert_prep_working_dir": 51, "besid": [21, 32], "best": [0, 14, 16, 27, 37], "beta": 11, "beta_": 11, "beta_1": [25, 26], "beta_2": [25, 26], "beta_constraint": [25, 26], "beta_initi": [25, 26], "beta_regular": [25, 26], "better": [4, 15, 16, 18, 19, 21, 24, 25, 27, 29, 32, 35, 36, 44, 51, 52, 54, 55, 60], "between": [16, 17, 18, 19, 21, 32, 34, 35, 39, 54, 61, 62], "bf16": [18, 19, 24, 31, 44, 45, 47, 51, 55, 60, 61, 62], "bf32": 20, "bfloat16": [4, 11, 18, 19, 21, 24, 28, 33, 47, 51, 55, 57, 60], "bfloat16graph_opt": 19, "bia": [13, 20, 24, 53], "bias_add": 53, "bias_initi": [25, 26], "biasadd": [20, 26], "biasaddgrad": 24, "big": 45, "bin": [3, 7, 11, 29, 34, 39, 40, 46, 47, 48, 52, 55, 56, 58, 60], "bin_threadpool": 3, "binari": [18, 34, 39, 40], "bind": [13, 30, 32, 40], "bind_al": 22, "bit": [15, 18, 28, 33, 37, 39, 41, 42, 47], "blob": [21, 34], "block": [11, 32, 33, 35, 36, 42], "blocker": 45, "blocktim": 32, "blog": 16, "board": 31, "bodi": 0, "bookcorpu": [31, 51], "bool": 11, "boolean": [24, 29], "boost": [4, 21, 29, 31, 32], "both": [4, 7, 14, 15, 18, 19, 23, 27, 29, 30, 31, 32, 33, 39, 47, 61], "bound": 32, "box": 15, "brain": 55, "branch": [5, 7, 39], "break": 24, "bridg": [21, 34], "briefli": 32, "bring": [23, 28, 29, 63], "browser": [5, 22, 41, 42, 49, 52, 54, 56], "bs1": 49, "bt": 35, "bu": [2, 30], "buffer": [16, 49], "bug": [7, 63], "buid": 40, "build": [4, 7, 9, 35, 43, 44, 45, 51, 63], "build_doc": 5, "build_pip_packag": [11, 39], "build_tmp": 5, "build_with_threadpool": 40, "builder": 61, "buildifi": 7, "buildtool": 7, "built": [11, 16, 34, 41, 42], "bus_id": 2, "busi": 32, "bzl": 7, "c": [2, 4, 10, 11, 14, 29, 30, 32, 35, 37, 38, 39, 41, 42, 43, 56, 63], "c481324031ecf0f70f8939516c02e16cac60446d": 60, "c_api_experiment": 40, "c_str": 40, "cach": [12, 15, 32, 35, 51], "calcul": [29, 54], "calibr": 52, "call": [11, 15, 16, 26, 28, 30, 32, 33, 35, 36, 43, 46, 52, 53, 56, 57], "callabl": 56, "can": [2, 3, 4, 7, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 45, 51, 55, 56, 60, 61, 62, 63], "cannot": [14, 18, 27, 35, 47, 48, 51, 54, 55, 57, 60], "capabl": [4, 14, 27, 28], "capi": 30, "card": [20, 51, 58], "case": [4, 13, 18, 19, 21, 28, 29, 32, 35, 47], "cast": [0, 18, 24, 28, 49], "cat": 29, "catch": 11, "caus": [27, 28, 32, 35, 56], "cbica": 55, "cc": [3, 11, 14, 17, 28, 30, 34, 42, 58, 62], "ccl": [38, 42], "cd": [2, 5, 7, 16, 32, 34, 39, 40, 47, 51, 54, 55, 57, 58, 60, 62], "cell": [28, 54], "center": [1, 4, 16, 21, 25, 26, 33, 39, 40, 42, 45, 47, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "cento": 41, "certain": [16, 29, 32], "challeng": 55, "chanc": [18, 28], "chang": [4, 5, 7, 11, 18, 19, 20, 21, 23, 27, 28, 29, 30, 36, 38, 44, 45, 56, 58], "channel": [0, 24, 25, 43], "channels_last": 62, "characterist": 0, "cheap": 35, "check": [5, 7, 11, 13, 14, 18, 19, 21, 23, 28, 29, 37, 38, 39, 40, 45, 46, 47, 57, 63], "checker": 32, "checkout": [5, 34, 40, 55, 60, 62], "checkpoint": 51, "choos": [16, 23, 25, 27, 28, 29, 32, 35, 39, 40, 43, 47, 49, 52, 53, 55], "chrome": 5, "circular": 27, "ckpt": [51, 57], "clang": 7, "clarifi": 0, "clariti": 0, "class": [0, 11, 28, 33, 35], "classic": 32, "classif": 22, "classifi": [44, 61], "classifier_train": 61, "classify_text_with_bert": 56, "claus": [4, 21, 23], "clean": [11, 40], "clearlist": 18, "clearlist_add": 18, "clearlist_remov": 18, "click": [11, 39, 40], "client": [2, 30, 40], "client_sess": 40, "clientsess": 40, "clock": 14, "clone": [5, 16, 34, 39, 40, 51, 54, 55, 57, 60, 61, 62], "close": [25, 27, 32], "closer": 24, "cluster": [27, 38], "cm": 37, "cmake": 39, "cnn": [18, 31, 32, 44, 45], "co": [4, 14, 15, 21], "coco": [31, 49, 60], "coco17": 49, "code": [2, 4, 5, 9, 11, 16, 20, 21, 22, 23, 27, 30, 31, 32, 34, 35, 43, 44, 45, 47, 49, 52], "codebas": [4, 30], "codenam": 4, "colab": 28, "collabor": [16, 63], "collect": [2, 32, 42], "color": 0, "com": [0, 5, 7, 8, 16, 21, 28, 32, 34, 35, 37, 38, 39, 40, 42, 45, 47, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "combin": [16, 21, 29, 32, 54], "come": 4, "comma": 32, "command": [2, 3, 14, 22, 29, 32, 37, 38, 39, 40, 41, 42, 46, 47, 49, 52, 57], "comment": [0, 7, 14], "commit": [0, 5, 17, 34], "common": [0, 11, 14, 17, 21, 32, 44, 51], "common_runtim": [11, 30], "commonli": 32, "commun": [0, 2, 7, 9, 21, 23, 32, 42, 63], "compact": [29, 32, 35], "compar": [16, 18, 28, 32, 44], "compat": [2, 3, 4, 15, 19, 21, 23, 26, 28, 30, 33, 35, 51, 52, 54, 55, 56, 57, 60, 61], "compet": 32, "competit": 32, "compil": [4, 11, 14, 16, 19, 21, 27, 28, 30, 32, 33, 34, 35, 36, 37, 38, 40, 42], "compiler_vers": 33, "complaint": 0, "complet": 32, "complic": [21, 29], "compon": [17, 19, 31, 33, 37, 38, 39, 40, 42], "compos": 17, "compressor": [4, 15, 21, 44, 45, 52], "comput": [4, 11, 15, 16, 25, 28, 32, 35, 37, 45, 53, 54, 63], "compute_dtyp": 28, "compute_gradi": 28, "concat": 35, "concaten": [35, 54], "concatv2": 49, "concept": [16, 28, 32], "concrete_funct": 35, "concurr": [4, 13, 20, 32, 35], "conda": [4, 14, 43, 51, 56], "conda_prefix": 29, "conduct": [7, 29], "conduit": [4, 30], "conf": 29, "config": [11, 14, 17, 18, 19, 28, 34, 35, 37, 39, 40, 42, 47, 52, 58, 61, 62], "config_fil": 61, "configproto": [17, 18, 19, 47, 52, 62], "configur": [4, 8, 11, 14, 17, 19, 21, 23, 28, 29, 33, 35, 37, 42, 49, 61, 63], "confirm": [29, 39, 40], "conflict": 35, "conform": 7, "connect": 32, "consecut": 32, "consequ": 0, "consid": [0, 18, 58], "consist": [7, 28], "consol": 42, "const": 40, "constant": [11, 15, 16, 25, 26, 28, 30], "constant_fold": 52, "constraint": 25, "construct": [0, 11, 17, 28], "constructor": 28, "consum": 51, "consumpt": [19, 21, 28, 47], "contact": 8, "contain": [5, 9, 15, 17, 27, 29, 32, 34, 43, 44, 55, 60, 63], "content": [5, 40, 42], "context": [11, 25, 32], "contigu": 32, "continu": [0, 14, 18, 27, 28], "contrast": 16, "contribut": [0, 4, 14, 21, 29, 39], "contributor": [7, 63], "control": [31, 32, 44, 52, 62], "conv": [17, 24, 53], "conv2d": [4, 21, 49, 53], "conv3d": 24, "convent": 7, "convers": [17, 18, 19, 24], "convert": [15, 16, 17, 18, 19, 28, 36, 45, 47, 49, 55, 61], "convert_to_tensor": 11, "convgradfilt": 24, "convolut": 32, "cooper": [4, 21, 44, 49, 52], "copi": [2, 3, 40], "copt": [11, 34], "copyright": 7, "core": [9, 11, 14, 17, 26, 28, 30, 31, 32, 35, 39, 40, 42, 52, 53, 58, 62], "core_id": 29, "core_list": 29, "correct": [28, 35, 39, 40], "correspond": [18, 29, 30, 36], "correspondli": 61, "cost": 15, "costli": 32, "could": [0, 18, 28, 33, 40, 45, 51, 52], "count": 14, "coupl": 32, "coven": [7, 63], "cover": [19, 21, 24, 29, 32], "cp": [3, 40, 51], "cp311": 40, "cpp": [3, 14, 17, 37], "cpplint": 7, "cpu": [2, 3, 4, 9, 11, 14, 15, 16, 18, 19, 20, 23, 24, 28, 31, 33, 34, 36, 43, 44, 45, 49], "cpudevic": 11, "cpunodebind": 32, "crash": 56, "creat": [11, 18, 28, 29, 30, 33, 36, 38, 42, 46, 49, 52, 55, 60, 62], "create_datasets_from_start": 51, "creatednnlengin": 11, "creatednnlstream": 11, "creation": 13, "critic": 18, "cross": [29, 32], "ctl": 61, "ctx": 11, "cuda": 28, "cuda_diagnost": 28, "cuda_driv": 28, "cuinit": 28, "curl": 38, "current": [14, 17, 22, 33, 51, 55, 60, 62], "custom": [4, 7, 9, 16, 18, 21, 26, 27, 29, 33, 37, 42, 51], "custom_graph_optimizer_registri": 58, "cv": 54, "cvfh": 3, "d": [7, 35, 37, 39, 40, 61], "d50dnp1sbb": 31, "dai": 51, "danger": 18, "dashboard": 22, "data": [4, 15, 16, 17, 18, 21, 22, 25, 28, 33, 35, 39, 40, 42, 45, 47, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "data_dir": [16, 51, 55, 60, 61], "data_f32": 11, "data_format": [20, 62], "data_typ": [18, 19, 47], "dataset": [19, 28, 31, 35, 52, 58], "dataset_dir": [55, 60], "datatyp": [33, 40, 51, 55, 60], "dch": 37, "dcmake_build_typ": 39, "ddr4": 31, "ddr5": 31, "de6201297144": [37, 42], "dealloc": 32, "dearmor": 37, "deb": [37, 39], "debug": [11, 20, 22, 33], "debugalloc": 32, "decai": 25, "decayed_learning_rate_at_crossover_point": 51, "decid": 17, "decis": [0, 17], "declar": 11, "decoupl": [25, 30], "dedic": 7, "deem": 0, "deep": [15, 25, 27, 32, 36, 44, 63], "deeper": 23, "deeplearningexampl": [31, 51, 55, 60], "def": [28, 30, 35], "default": [4, 7, 13, 14, 15, 18, 19, 20, 21, 23, 27, 28, 30, 31, 32, 33, 35, 39, 40, 51, 52, 53, 60, 61, 62], "default_data_typ": [18, 33], "default_dataset": 49, "default_static_qconfig": 49, "defin": [4, 16, 28, 40], "definit": [7, 18, 23, 33], "deleg": 15, "deliv": [4, 19, 21, 27], "delta_tim": 35, "demand": [13, 63], "demo": 22, "demonstr": [0, 31, 44], "denali": 31, "deni": 18, "dens": [19, 20, 28, 35], "dense1": 28, "dense2": 28, "dense_1": [19, 28], "dense_2": [19, 28], "dense_logit": [19, 28], "denylist": 18, "denylist_add": 18, "denylist_remov": 18, "dep": [11, 34], "depend": [14, 16, 19, 29, 32, 36, 37, 39, 40, 42], "deploi": [21, 34], "deploy": [38, 41, 42], "deprec": 39, "depthwiseconv2dn": 49, "dequant": [49, 52], "derogatori": 0, "desc": [11, 13], "descibl": 11, "describ": [25, 28, 29, 32], "descript": [9, 13, 18, 29, 32, 33, 44, 56], "descriptor": 11, "design": [4, 7, 9, 21, 30, 34, 45], "desir": [18, 29], "destruct": 32, "detail": [2, 3, 11, 15, 16, 17, 18, 19, 21, 23, 25, 28, 32, 33, 36, 37, 39, 40, 42, 45, 47, 51, 63], "detect": [32, 49], "determin": [0, 11, 28, 32], "dev": [2, 3, 14, 22, 34, 39, 42, 47, 57], "develop": [4, 14, 16, 21, 30, 32, 37, 39, 40, 41, 42, 63], "deviat": 25, "devic": [2, 3, 4, 9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 28, 33, 34, 39, 40, 42, 47, 62, 63], "device_cpu": 11, "device_gpu": [11, 17, 62], "device_lib": 2, "device_num": [17, 62], "device_typ": [2, 14, 17, 39, 40, 58, 62], "diagram": 63, "dialect": [16, 17], "dict": 35, "did": [28, 32], "diff_undef": 11, "diffent": 27, "differ": [0, 2, 4, 13, 16, 20, 21, 23, 25, 29, 30, 32, 33, 35, 36, 43], "differenct": [39, 40], "differenti": 39, "difficult": 30, "diffus": [44, 63], "digit": [19, 28], "dim": 13, "dimens": 17, "dir": [2, 3, 7, 51, 55, 56, 57, 60], "directli": [11, 14, 17, 27, 28, 29, 32, 36, 42], "directori": [2, 3, 4, 5, 7, 14, 17, 29, 34, 37, 39, 40, 42, 47, 48, 49, 51, 54, 55, 57, 60], "diretcori": 40, "disabl": [0, 15, 19, 27, 29, 30, 32, 33], "disable_numactl": 29, "disable_taskset": 29, "disbal": 39, "discontinu": 14, "discuss": 7, "disk": [36, 49], "disparag": 0, "displai": [20, 49], "distanc": 54, "distinguish": [28, 30], "distribut": [2, 4, 8, 31, 32, 37, 38, 42, 43, 44, 51, 60, 61, 63], "distribution_strategi": 62, "divers": 0, "divid": [25, 28, 32], "divis": 28, "dl": 7, "dll": 51, "dllogger": [55, 60], "dllvm_enable_project": 39, "dnnl": [11, 13], "dnnl_arg_dst": 11, "dnnl_arg_scratchpad": 11, "dnnl_arg_src": 11, "do": [7, 14, 19, 27, 28, 29, 33, 36, 39, 52], "do_benchmark": 35, "do_lower_cas": 16, "do_predict": [16, 57], "do_train": [16, 57], "doc": [5, 9, 11, 39, 56], "doc_strid": 57, "docker": [9, 43, 44], "dockerfil": 2, "dockerhub": 63, "docs_build": 9, "docstr": 11, "document": [2, 3, 28, 31, 36, 38, 39, 40], "doe": [16, 24, 27, 28], "doesn": [5, 17, 18, 36, 56], "domin": 28, "don": [28, 49], "done": [7, 22, 28, 32, 35, 37], "doubl": 28, "download": [2, 8, 28, 32, 37, 42, 49, 51, 60, 61], "download_and_preprocess_coco": 60, "downstream": 18, "dpc": [21, 37, 38, 39, 40, 42], "dpcpp": [33, 37], "draft": 5, "dramat": 32, "dri": [2, 3, 34, 42, 47], "drive": 35, "driver": [2, 3, 14, 28, 31, 38, 45, 47, 52, 63], "drop": [18, 29, 35], "dropout": 35, "dst_mem": 11, "dst_tensor": 11, "dt_float": [20, 40], "dtype": [11, 19, 25, 26, 30, 35, 53, 62], "dtype_polici": 28, "due": [18, 27, 32, 35], "dummi": [31, 49, 61], "dummy_v2": 49, "dump": [20, 35], "duplic": 39, "dure": [0, 15, 16, 18, 19, 24, 28, 36, 38, 39, 40, 47], "dut3046": 28, "dynam": [13, 28, 32, 35, 36], "e": [0, 2, 3, 5, 11, 17, 28, 29, 34, 40, 60, 61], "each": [14, 25, 28, 29, 30, 31, 32, 62], "eager": [11, 25], "earli": 37, "easi": [16, 21, 30, 45], "easiest": 38, "easili": [16, 30, 31, 33], "ecc": 31, "echo": [37, 51], "econom": 0, "ecosystem": [16, 30, 63], "ed": 40, "edit": [0, 2], "edu": 55, "educ": 0, "effect": [18, 29, 32], "effici": [4, 16, 21, 30, 32, 34, 35, 51, 62, 63], "effort": 37, "egg": 60, "eigen": [4, 20], "either": [3, 19, 27, 49], "elaps": [32, 49], "elig": 11, "elimin": [16, 36], "els": [19, 28, 40, 61], "eltwis": 11, "eltwise_bas": 11, "eltwise_base_hdr": 11, "eltwise_forward": 11, "eltwise_gelu_erf": 11, "eltwise_gelu_tanh": 11, "eltwise_relu": 11, "eltwisebaseop": 11, "elu": 24, "email": 0, "emit": 16, "empathi": 0, "empir": 25, "en": 42, "enabl": [4, 13, 15, 16, 17, 18, 21, 22, 25, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 40], "enable_checkpoint_and_export": 62, "enable_itex_amp": 29, "enable_itex_layout_opt": 29, "enable_jemalloc": 29, "enable_op_parallel": 29, "enable_tcmalloc": 29, "enable_tensorboard": 62, "enable_tf_profil": [4, 21, 22, 28], "enable_xla": 62, "encod": 20, "encompass": 16, "encount": 14, "end": [28, 35, 39, 40, 44, 45, 52], "engin": [11, 14], "enhanc": [4, 30], "ensur": [7, 29], "enter": [2, 3, 22, 38, 39, 40], "enterpris": [31, 42], "entir": 28, "entri": 17, "enum": 33, "env": [14, 34, 38, 39, 40, 42, 46, 51, 52, 54], "env_check": [37, 38, 42, 63], "env_itex": [46, 47, 52, 54, 55, 56, 58, 60], "env_itex_cpu": [48, 56], "env_nam": 46, "environ": [0, 2, 4, 11, 13, 15, 16, 19, 21, 22, 23, 27, 28, 30, 32, 34, 35, 43, 44, 63], "environment": [30, 40], "epoch": [18, 19, 28, 35, 51, 58, 60], "epoch_loss_avg": 28, "epsilon": [25, 26], "equal": [24, 27, 32], "equival": [4, 28], "error": [4, 7, 11, 14, 20, 25, 28, 34, 47, 48, 51, 54, 55, 56, 57, 60], "errors_impl": [14, 47, 48, 51, 54, 55, 57, 60], "especi": [13, 38], "estim": [36, 63], "et": 25, "etc": [21, 30, 37, 39], "ethernet": 31, "ethnic": 0, "eu": 14, "eval_batch_s": 51, "evalu": [19, 28, 35, 54, 57], "even": [28, 29, 32, 43, 51, 63], "event": 0, "everi": [18, 20, 54], "everyon": 0, "evo": 31, "evolv": 30, "exact": 31, "exact_match": [51, 57], "exactli": 30, "exampl": [0, 2, 4, 5, 7, 9, 11, 14, 15, 20, 21, 24, 25, 26, 28, 31, 32, 33, 34, 37, 38, 45, 47, 50, 52, 56, 63], "example_test": 40, "except": [30, 33, 42, 51], "excess": 30, "exclud": 7, "exclus": 29, "excutor": 27, "exec": [11, 13], "exec_mod": 55, "execut": [2, 5, 11, 13, 15, 16, 17, 18, 19, 20, 22, 25, 28, 31, 32, 36, 39, 44, 52, 53], "executor": 15, "exist": [19, 24, 26, 28, 29, 45], "exit": 34, "exp": 18, "expect": [18, 38, 52, 63], "experi": [0, 4, 21, 23, 32], "experiment": [4, 13, 14, 22, 33, 39, 40, 42], "experimental_compil": 30, "experimental_gelu": 16, "experimental_ops_overrid": [26, 33], "explain": 18, "explan": 0, "explicit": [0, 11, 28, 32], "explicitli": [28, 29, 33, 52], "export": [4, 7, 11, 15, 16, 17, 18, 19, 21, 22, 28, 29, 30, 32, 34, 37, 38, 40, 42, 46, 47, 51, 52, 54, 57, 61, 62, 63], "expos": [21, 22, 63], "expr": 51, "express": 0, "extend": [4, 14, 21, 23, 25, 30, 32, 33], "extens": [5, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 31, 32, 36, 38, 43, 44, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "extent": 31, "extern": [0, 14, 40], "extra": [18, 28, 36], "extract": 51, "f": [2, 35, 40, 63], "f0": 11, "f1": [51, 57], "f502f0715979ec73c571ca5676ba58431b916f5f58ee3333": 56, "facilit": [4, 30], "factor": [21, 29], "fail": [11, 28, 33, 36], "fair": 0, "fairli": 0, "fallback": 25, "fals": [7, 16, 17, 25, 27, 28, 29, 35, 51, 57, 62], "familiar": 11, "faq": 0, "far": 28, "fashion": [4, 21], "fast": 25, "faster": [18, 19, 25, 27, 28, 32, 35, 36, 47, 49], "fatal": 14, "fdc7a2bc": [37, 42], "featur": [4, 7, 8, 11, 13, 17, 25, 32, 36, 39, 44, 52, 62, 63], "feedback": [0, 7], "fetch": 40, "few": [28, 61], "fewer": 28, "fi": 61, "fi_provid": 38, "fid": 54, "field": [33, 39, 40], "fig": [16, 36], "figur": [16, 30, 32], "file": [2, 5, 7, 14, 17, 18, 22, 29, 34, 37, 42, 47, 48, 49, 51, 54, 55, 56, 57, 60, 61, 63], "filenam": 35, "fill": [39, 40], "filter": 7, "filter_height": 53, "filter_width": 53, "final": [17, 19, 28, 51], "final_carry_st": 25, "final_memory_st": 25, "find": [7, 11, 22, 31, 32, 34, 36], "fine": [28, 29, 31, 32, 35, 51], "finish": [28, 35, 39, 53, 56], "first": [17, 18, 19, 22, 24, 25, 27, 28, 29, 30, 32, 37, 38, 39, 41, 42, 51, 55, 60], "fit": [19, 32, 35], "fix": [7, 28, 37], "flag": [17, 30, 40, 60], "flex": [39, 40, 42, 45, 47, 50, 52, 54, 57, 63], "flexibl": [4, 30, 33, 35], "flexibli": 63, "float": [11, 18, 20, 28, 33, 40, 47], "float16": [4, 16, 18, 19, 21, 28, 33, 47], "float16graph_opt": [18, 19], "float32": [11, 19, 24, 25, 26, 28, 30, 35, 51, 53, 55, 60], "flow": [16, 28], "flower": 52, "focus": [0, 30], "fold": 15, "folder": [2, 3, 19, 34, 39, 40, 61], "follow": [0, 2, 3, 7, 15, 16, 17, 18, 22, 24, 27, 28, 29, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 45, 47, 48, 51, 53, 54, 55, 56, 57, 60, 61, 62, 63], "follw": 62, "footprint": 36, "forg": [14, 56], "fork": [32, 35], "format": [7, 9, 18, 24, 28, 33, 35, 36, 61], "forth": 63, "forward": [11, 28, 54], "forward_train": 11, "found": [7, 14, 28, 29, 32, 34, 36, 39, 51], "four": 18, "fp": 47, "fp16": [16, 18, 19, 31, 44, 47, 51], "fp32": [16, 18, 19, 20, 24, 31, 44, 45, 49, 51, 52, 60], "fpn": 49, "fraction": 16, "framework": [14, 16, 30, 35, 36, 37, 40, 47, 48, 50, 51, 54, 55, 57, 60], "free": [0, 21, 29], "frequenc": [14, 31], "frequent": [4, 36], "friendli": 32, "from": [0, 3, 5, 7, 11, 16, 17, 18, 19, 21, 22, 27, 28, 29, 30, 32, 33, 35, 36, 37, 39, 43, 44, 47, 49, 50, 51, 52, 55, 56, 63], "from_logit": 35, "from_model": 49, "from_tensor_slic": 28, "frontend": [4, 16, 21, 23], "frozen": 19, "fr\u00e9chet": 54, "full": [7, 39, 40, 42], "fulli": [4, 19, 21, 30, 35], "function": [5, 17, 20, 21, 23, 25, 26, 28, 30, 32, 33], "fundament": 16, "further": [4, 16, 21], "fuse": [4, 16, 18, 19, 21, 24, 26, 51], "fusedaccmatmul": 24, "fusedbatchnorm": 24, "fusedbatchnormgrad": 24, "fusedmatmul": 24, "fusion": [4, 9, 17, 18, 19, 21, 26, 33], "fwd_desc": 11, "fwd_pd": 11, "fwd_primit": 11, "fwd_primitive_arg": 11, "g": [5, 17, 28, 40, 56, 61], "g10": [39, 40], "g11": [39, 40], "gamma_constraint": [25, 26], "gamma_initi": [25, 26], "gamma_regular": [25, 26], "gate": 25, "gaussian": 25, "gb": 31, "gbs1": 51, "gbs2": 51, "gcc": [33, 39], "gd": 35, "gddr6": 31, "gelu": [11, 33], "gelu_erf": 24, "gelu_tanh": 24, "geluop": 11, "gen": 31, "gen9": 11, "gender": 0, "gener": [4, 5, 16, 20, 21, 23, 28, 29, 30, 31, 32, 34, 38, 39, 41, 47, 49, 52], "get": [2, 4, 7, 11, 13, 21, 28, 31, 32, 33, 34, 35, 37, 39, 40, 47, 48, 51, 54, 55, 57, 60, 63], "get_concrete_funct": 35, "get_config": 35, "get_scaled_loss": 28, "get_unscaled_gradi": 28, "get_weight": 28, "getattr": 11, "getsitepackag": [37, 38, 42, 63], "gh": 5, "ghz": 31, "gigabit": 31, "gin": 58, "git": [5, 11, 16, 33, 34, 39, 40, 47, 51, 54, 55, 57, 58, 60, 61, 62], "git_vers": [33, 38], "github": [5, 7, 8, 16, 21, 32, 34, 39, 40, 45, 47, 51, 54, 55, 57, 58, 60, 61, 62, 63], "give": [0, 35], "given": [17, 25, 29, 55], "glibcxx": 14, "glibcxx_3": 14, "global": [17, 28, 33, 62], "glorot_uniform": [25, 26], "glue_dataset": 16, "glue_dir": 16, "go": [7, 40, 41, 42], "go1": 7, "golang": 7, "gold": 31, "gomp": 32, "gomp_cpu_affin": 32, "good": [4, 19, 21, 23, 32, 34, 36], "googl": [7, 14, 16, 21, 22, 34, 57], "google_pretrained_weight": 51, "googleapi": [28, 35, 47, 49, 56], "govern": 63, "governor": 31, "gperftool": 32, "gpg": [37, 39], "gpu": [3, 4, 9, 11, 14, 15, 16, 18, 19, 20, 23, 24, 25, 27, 28, 33, 34, 38, 43, 44, 49, 63], "gpu_kernel": 11, "gpu_profil": 28, "gpudevic": 11, "gracefulli": 0, "grad": 28, "gradient": 28, "gradienttap": 28, "granular": [29, 32, 35], "graph": [4, 9, 10, 13, 15, 16, 18, 20, 23, 30, 35, 36, 44, 53, 62, 63], "graph_def": 35, "graph_opt": [17, 18, 19, 33, 47, 52, 62], "graph_pb2": 35, "graphdef": [17, 18, 35], "graphic": [37, 39, 40], "graphopt": [17, 18, 19, 47, 62], "grappler": [15, 17, 19, 58], "greater": [24, 32], "greaterequ": 24, "greatli": 28, "green": 15, "grep": 52, "group": [25, 32], "gt": [18, 33, 62], "guarante": 37, "guid": [4, 9, 11, 18, 21, 28, 31, 34, 37, 39, 40, 42, 44, 45, 52, 63], "guidelin": [1, 4, 16, 50, 63], "guidlin": 31, "gxx_linux": [14, 56], "gz": [7, 32, 49], "h": [7, 11, 14, 17, 34, 40], "ha": [2, 3, 4, 14, 18, 19, 20, 28, 30, 32, 36, 37, 40, 51, 62], "had": [28, 32], "half": [11, 28], "halv": 28, "hand": 16, "handl": [1, 13], "handwrit": [44, 45], "happen": [28, 36, 56], "harass": 0, "hard": [2, 54], "hardwar": [4, 16, 17, 19, 21, 23, 25, 29, 33, 35, 44], "harm": 0, "hasattr": [11, 33], "hasn": 54, "hat": 42, "have": [0, 18, 28, 32, 37, 38, 39, 42, 45, 49, 52], "hbm2e": 31, "hdr": [11, 34], "he": 25, "he_norm": 35, "header": 11, "headless": 60, "healthi": 0, "heap": 32, "help": [14, 19, 20, 21, 29, 32, 39, 40, 45, 52], "here": [8, 11, 14, 17, 18, 24, 27, 30, 35, 36, 39, 40, 49, 51, 54, 55, 60, 62], "heterogen": [17, 63], "heurist": 17, "high": [14, 16, 17, 28, 32, 63], "higher": [14, 15, 20, 28, 32], "highli": 28, "histori": [19, 28], "hlo": 16, "hochreit": 25, "hold": 32, "home": [7, 29, 37, 41, 42, 56], "homogen": 17, "hook": 17, "horovod": [2, 31, 37, 38, 42, 44, 51, 60], "horovodversionmismatcherror": 51, "host": [2, 3, 28, 39, 42, 47], "hour": 31, "how": [1, 5, 14, 17, 18, 27, 32, 34, 39, 40, 42, 44, 49, 58, 61, 63], "howev": [18, 21, 24, 28, 29, 30, 32, 54], "hpp": 11, "hs_to_tfg": 17, "hsp": 17, "html": [0, 5, 11, 39, 42], "html64": [7, 37], "http": [0, 2, 5, 7, 8, 16, 21, 22, 28, 32, 34, 35, 37, 38, 39, 40, 41, 42, 45, 47, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "http_proxi": [2, 3], "https_proxi": [2, 3], "hub": 34, "hurt": 33, "hutter": 25, "hvd": 51, "hvd_configur": 61, "hvd_support": 61, "hyper": [29, 31, 32], "hyperparamet": 51, "hyphen": 32, "i": [0, 4, 5, 7, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "i0203": 61, "i0324": 62, "i0817": 61, "i1015": 51, "i1021": 51, "i1022": 51, "icd": [37, 42], "id": [2, 30, 34], "idea": 32, "ident": [0, 28], "identif": 28, "identifi": 39, "if_not_mobil": 34, "igc": 37, "ignor": [18, 28, 34], "ii": [18, 19, 33], "iii": [18, 19], "illustr": 32, "ilov": 25, "imag": [27, 28, 35, 41, 42, 44, 49, 54], "image_classif": [61, 62], "image_nam": [2, 3], "imagenet": 22, "imageri": 0, "img_arrays_for_acc": 54, "impact": [0, 5, 14, 18, 24, 32, 56], "implement": [4, 7, 10, 16, 17, 19, 21, 23, 25, 26, 30, 32, 35, 49, 51, 63], "import": [2, 7, 11, 14, 17, 18, 19, 22, 23, 25, 26, 27, 28, 30, 32, 35, 37, 38, 39, 40, 41, 42, 47, 49, 52, 53, 56, 63], "import_graph_def": 35, "imports_graph_def": 35, "improv": [15, 16, 19, 28, 32, 36, 39, 40, 49, 62], "inappropri": 0, "incarn": 2, "incept": [15, 18, 35, 44, 49, 54], "inceptionv4": 35, "inceptionv4_fp32_pretrained_model": [35, 47], "incid": 0, "includ": [0, 7, 13, 14, 16, 17, 18, 20, 23, 40, 42, 51, 52, 53, 63], "include_subdir": 7, "inclus": 0, "incorrect": 28, "increas": [18, 28, 52], "independ": [16, 25, 29, 35], "index": [18, 32], "indic": [24, 28, 47, 62], "individu": [0, 16, 20], "inf": 28, "infer": [11, 15, 16, 17, 18, 19, 24, 28, 34, 36, 44, 45, 51, 52, 56], "infer_config": 52, "infer_fp32_vs_amp": 47, "infer_inception_v4_amp": 47, "infer_resnet50": [29, 48], "inferlist": 18, "inferlist_add": 18, "inferlist_remov": [18, 19], "infin": 28, "influenc": [21, 29, 32], "info": [17, 18, 29, 36, 40, 45, 47, 49], "inform": [0, 1, 7, 8, 16, 20, 29, 32, 33, 39, 40, 42, 45, 52, 61, 63], "infrastructur": [4, 9, 20, 63], "init": 11, "init_checkpoint": 57, "initi": [17, 20, 28, 31, 35, 39, 40], "initial_weight": 28, "innov": [4, 63], "inplac": 7, "input": [4, 11, 13, 17, 19, 20, 21, 22, 24, 25, 28, 33, 35, 62], "input_height": 53, "input_shap": [35, 49], "input_width": 53, "input_x": 35, "insert": [18, 19, 24, 35, 52], "insid": [2, 63], "inspir": 0, "instal": [2, 3, 4, 7, 9, 14, 18, 19, 21, 22, 23, 26, 27, 28, 29, 31, 32, 33, 45, 46, 47, 48, 51, 52, 54, 55, 56, 57, 60], "install_head": 40, "instanc": [0, 31], "instance_idx": 29, "instancenorm": [19, 26], "instead": [36, 37, 39, 51, 54, 55, 60], "instruct": [2, 3, 4, 7, 16, 18, 19, 21, 31, 32, 41, 42, 54, 61, 63], "insult": 0, "int": [11, 35, 40, 51], "int8": [4, 28, 31, 45, 49, 52], "integ": 29, "integr": [4, 15, 16, 30, 32, 39], "intel": [0, 1, 5, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 36, 38, 43, 44], "intel_extension_for_tensorflow": [11, 17, 18, 19, 25, 26, 28, 29, 34, 37, 38, 39, 41, 42, 47, 49, 63], "intel_extension_for_tensorflow_lib": [11, 39], "intel_xpu": 2, "intelai": 16, "intelpython3_ful": 38, "intend": [7, 16, 63], "intent": 7, "inter": [4, 20, 35], "inter_op_parallelism_thread": 35, "interact": [0, 39], "interfac": [17, 30, 43, 63], "intermedi": [16, 28], "intern": 16, "internet": 47, "interop": 29, "interpret": 29, "intraop": 29, "introduc": [16, 29, 32, 36], "introduct": 19, "invalid": [13, 27, 32], "invent": 15, "investig": [0, 29], "invis": 0, "invok": [16, 17], "involv": 0, "io": [5, 34], "ip": 56, "ipc": [2, 3, 42, 47], "ipp": 55, "ipykernel": 54, "ipynb": [52, 54, 56], "ipython": 56, "ir": [16, 17], "irc_na": [37, 42], "is_bf16_math_mod": 24, "is_gpu_avail": 28, "isol": [37, 41, 42], "issu": [0, 1, 4, 7, 14, 18, 28, 37, 39, 40, 42, 56, 63], "item": [22, 35], "iter": [20, 31, 35, 36, 62], "itex": [0, 2, 3, 4, 8, 9, 11, 13, 14, 17, 18, 19, 20, 21, 23, 26, 27, 28, 29, 30, 31, 34, 37, 38, 39, 40, 41, 42, 46, 47, 52, 54, 62, 63], "itex_auto_mixed_precis": [16, 18, 19, 29, 33, 47], "itex_auto_mixed_precision_allowlist_add": [18, 19], "itex_auto_mixed_precision_allowlist_remov": 18, "itex_auto_mixed_precision_clearlist_add": 18, "itex_auto_mixed_precision_clearlist_remov": 18, "itex_auto_mixed_precision_data_typ": [16, 18, 19, 47], "itex_auto_mixed_precision_denylist_add": 18, "itex_auto_mixed_precision_denylist_remov": 18, "itex_auto_mixed_precision_inferlist_add": 18, "itex_auto_mixed_precision_inferlist_remov": [18, 19], "itex_auto_mixed_precision_log_path": [18, 19, 20, 33], "itex_auto_mixed_precision_unsafe_force_al": 18, "itex_bf16": 61, "itex_bf16_lar": 61, "itex_build": [39, 40], "itex_cfg": [17, 62], "itex_check_eq": 11, "itex_cpp_min_log_level": 20, "itex_disable_xla": 27, "itex_dummy_bf16": 61, "itex_dummy_bf16_lar": 61, "itex_dummy_fp32": 61, "itex_dummy_fp32_lar": 61, "itex_enable_multiple_stream": 62, "itex_enable_nextpluggable_devic": 27, "itex_fp32": 61, "itex_fp32_lar": 61, "itex_fp32_math_mod": [20, 51], "itex_gpu_wrapp": 42, "itex_layout_opt": [29, 32, 33], "itex_layout_optitex_remapperitex_auto_mixed_precisionitex_shard": 33, "itex_omp_threadpool": [3, 4, 20, 29, 35, 40], "itex_onednn_graph": [33, 52], "itex_ops_overrid": 27, "itex_optimizer_after_shard": 17, "itex_optimizer_before_shard": 17, "itex_quant": 49, "itex_remapp": 33, "itex_repo": 47, "itex_shard": 33, "itex_sync_exec": 33, "itex_tf_constant_fold": [15, 52], "itex_tile_as_devic": 20, "itex_verbos": [11, 17], "itex_vlog": 11, "itex_xpu_librari": 11, "itex_xx": 61, "itexauto_mixed_precision_opt": [18, 19], "itexdatatyp": 33, "itexgelu": 26, "itexgelugrad": 26, "itexlayernorm": 26, "itexlayernormgrad": 26, "itexlstm": 26, "itexresourceapplyadamwithweightdecai": 26, "itexrnn": 26, "its": [4, 11, 25, 28, 29, 30, 32, 37, 42, 53], "iv": [18, 19], "jammi": [37, 39], "jax": [16, 27, 30, 63], "jemalloc": 32, "jit": [4, 16, 27, 30], "jit_compil": 27, "job": [11, 20, 40], "join": [22, 32, 35], "json": [16, 35, 57], "just": [0, 4], "k8": [3, 40], "kaim": 25, "kdstindex": 11, "keep": [28, 32], "keepdim": 35, "kei": [9, 17, 20, 36, 37, 39], "kept": [26, 28], "kera": [4, 19, 25, 26, 31, 35, 51, 52, 54, 58, 63], "keras_util": [61, 62], "kerascv": 31, "keraslay": 22, "kernel": [2, 3, 9, 10, 15, 20, 22, 23, 24, 25, 28, 30, 31, 35, 37, 39, 40, 41, 42, 51, 52, 54, 56, 63], "kernel_initi": [25, 26], "kernels_experiment": 34, "keyr": 37, "kind": [0, 4, 21, 53], "kitti": 49, "kmp": 32, "kmp_affin": [29, 32, 35], "kmp_blocktim": [29, 32, 35], "knob": 29, "know": [19, 28], "knowledg": [19, 32], "known": [16, 28, 56], "kwarg": [25, 26, 35], "l": [34, 35, 40], "l28": 34, "l2loss": 24, "l_basekit_p_2024": [37, 42], "label_shap": 49, "ladder": 0, "lake": [4, 21], "lamb": [25, 51], "lambda": 25, "languag": [0, 40], "language_model": 16, "languagemodel": 51, "laptop": 14, "lar": 61, "larg": [4, 16, 20, 25, 28, 32, 35, 36, 44], "larger": [31, 32, 35, 39, 40], "last": [28, 56], "latenc": [13, 35, 47, 54], "latency_mod": 29, "later": [32, 37, 41, 42], "latest": [8, 27, 31, 34, 38, 39, 40, 42, 63], "launch": [21, 42, 54], "launcher": [4, 29, 32], "layer": [2, 9, 16, 19, 25, 28, 35, 52], "layer_0": 20, "layernorm": [19, 24, 26], "layernormgrad": 26, "layout": [13, 29, 33, 36], "layout_opt": 33, "ld": 32, "ld_library_path": 40, "ld_preload": [29, 32], "lead": [0, 16, 18], "leader": 0, "leakyrelu": 24, "learn": [0, 14, 15, 16, 19, 21, 25, 27, 29, 32, 34, 36, 44, 45, 63], "learning_r": [25, 26, 57], "learning_rate_per_gpu": 51, "learning_rate_phase1": 51, "learning_rate_phase2": 51, "least": [28, 37, 38], "leav": 32, "legaci": [27, 30, 51, 54, 55, 56, 57, 60, 61, 62], "legal": 7, "len": 35, "length": [16, 31, 51], "less": [4, 18, 19, 21, 24, 28, 35, 47], "lessequ": 24, "let": [18, 28, 34, 35], "level": [0, 14, 16, 17, 23, 24, 28, 37], "level_zero": 14, "level_zero_util": 14, "leverag": [4, 16], "lib": [2, 14, 29, 39, 40, 56], "lib64": 29, "lib_path": 40, "libgomp": 32, "libiari": 42, "libigc1": 37, "libigdfcl1": 37, "libigdgmm12": 37, "libiomp": 32, "libiomp5": [32, 40], "libitex": 40, "libitex_common": 39, "libitex_cpu": 39, "libitex_cpu_cc": [34, 40], "libitex_gpu": 39, "libitex_gpu_cc": [34, 40], "libitex_gpu_xetla": 40, "libmkl_sycl": [14, 47, 48, 51, 54, 55, 57, 60], "libomp": 39, "librari": [2, 3, 11, 14, 16, 29, 32, 37, 39, 42, 55], "library_path": 40, "libtensorflow": 40, "libtensorflow_cc": 40, "libtensorflow_framework": 40, "like": [0, 2, 7, 17, 25, 28, 32, 33, 46, 47, 57, 58], "limit": [16, 17, 32, 63], "line": [7, 28, 32, 34, 47, 56, 62], "linear": [4, 16, 19, 21, 25, 28, 30], "linearli": 25, "link": [2, 31, 40, 52], "linkstat": 11, "linux": [2, 3, 7, 29, 31, 32, 38, 39, 40, 41, 42, 52], "list": [2, 7, 11, 16, 19, 24, 27, 28, 29, 30, 32, 35, 37, 39, 40], "list_local_devic": 2, "list_physical_devic": [14, 19, 28], "littl": 18, "live": 16, "ll": [20, 24], "lld": 39, "lldb": 39, "llga": [7, 33], "llvm": [16, 39], "llvm_openmp": 40, "ln": 40, "load": [11, 28, 34, 35, 42], "load_data": [19, 28, 35], "load_ops_librari": 11, "load_pb": 35, "load_ref_result": 54, "local": [2, 3, 7, 14, 19, 29, 31, 32, 34, 35, 39, 40, 41, 42, 49, 58], "localalloc": 29, "localhost": [5, 11, 20, 41, 42], "locat": [7, 8, 39, 40, 51, 54], "lock": 13, "log": [7, 11, 18, 20, 22, 28, 33, 35, 40, 42, 47, 48, 51, 54, 55, 56, 57, 58, 60, 62], "log_everi": [55, 60], "log_file_prefix": 29, "log_path": 29, "log_step": 62, "log_warmup_step": 60, "logdir": 22, "logic": 32, "logit": 35, "logpath": 22, "long": [25, 30], "look": [2, 24, 34, 39, 40], "loop": [54, 62], "loshch": 25, "loss": [15, 18, 19, 31, 35, 44, 45, 52, 58], "loss_object": 28, "loss_scal": 28, "lossscaleoptim": 28, "low": [4, 16, 18, 21, 23, 28, 45], "lower": [4, 15, 18, 19, 21, 35, 47], "lowpropos": 49, "lr": [25, 51, 58], "lscpu": [32, 52], "lstm": 25, "lt": [31, 33, 37], "ltensorflow_cc": 40, "ltensorflow_framework": 40, "m": [5, 29, 32, 45, 46, 49, 54, 55, 58, 60], "m150": [39, 40], "m75": [39, 40], "machin": [2, 3, 14, 16, 21, 28, 29, 32, 34, 41, 42, 53, 58], "macro": 11, "made": [11, 30, 55], "mai": [0, 7, 13, 14, 16, 18, 19, 24, 28, 29, 32, 35, 36, 37, 38, 42, 54, 63], "mail": 0, "main": [5, 17, 21, 37, 39, 40, 55, 58, 60, 61], "mainli": [15, 17, 29], "maintain": [0, 7, 8, 14, 18, 21, 23, 25, 34, 36], "make": [0, 2, 3, 5, 7, 11, 16, 18, 19, 28, 30, 32, 35, 36, 39, 40, 47], "makefil": 40, "malloc": [29, 32], "malloc_conf": 29, "man": 32, "manag": 63, "mani": [16, 18, 21, 28, 29, 32, 58], "manner": 16, "manual": [5, 7, 18, 28, 29, 51, 61], "manylinux2014": [37, 41, 42], "manylinux2014_x86_64": 40, "manylinux_2_17_x86_64": 40, "map_structur": 35, "mark": 17, "mask": [25, 44], "maskrcnn": 60, "master": [32, 34, 36], "match": [16, 29, 36, 43], "matcher": 24, "math": [20, 24, 28, 37, 42], "matmul": [17, 20, 24, 26, 35, 36, 40, 49], "matrix": [36, 40], "max": [16, 33, 39, 40, 42, 47, 50, 51, 54, 55, 56, 57, 58, 60, 61, 62, 63], "max_seq_length": 57, "max_step": 55, "maxim": [4, 17, 21, 25, 33, 62], "maximum": [31, 51], "maxpool": 49, "maxpool3d": 24, "maxval": 35, "md": 21, "mean": [13, 14, 18, 25, 27, 28, 29, 32, 35, 36, 39, 40], "mechan": [4, 16, 21, 30], "media": 0, "medic": 44, "meet": [3, 25, 51, 63], "member": [0, 33], "membind": 32, "memori": [4, 9, 11, 13, 14, 15, 16, 18, 19, 21, 25, 28, 31, 36, 47, 51], "memory_limit": 2, "mention": [28, 32], "merg": 5, "messag": [28, 29], "meta": 13, "metadata_thp": 29, "metal": 44, "method": [28, 32, 45, 52], "metric": [19, 28, 35], "middl": 28, "might": [11, 39], "migrat": 7, "millisecond": 32, "mind": 16, "miniconda": 38, "miniconda3": 38, "minim": [15, 32], "minimum": [31, 39], "minor": [4, 21, 23], "minut": [25, 39, 40], "minval": 35, "miscellan": 9, "mismatch": 28, "miss": 15, "mistak": 0, "mit": 52, "mix": [4, 31, 33, 35, 44, 49], "mixed_bfloat16": 28, "mixed_float16": 28, "mixed_precis": 28, "mkdir": [2, 3, 39, 61, 62], "mkl": [7, 34, 37, 38, 39, 40, 42], "ml": 16, "mlir": 17, "mnist": [19, 28, 34, 35, 44, 58], "mnist_client": 34, "mnist_saved_model": 34, "mode": [16, 17, 20, 24, 31, 33, 39, 51, 54, 61], "model": [2, 3, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 27, 32, 33, 35, 36, 44, 45, 52, 56, 58, 62, 63], "model_base_path": 34, "model_dir": [3, 34, 55, 60, 61, 62], "model_nam": [3, 34], "model_path": 49, "model_serv": [3, 34], "model_training_util": 51, "model_typ": 61, "modelserv": 34, "moder": 0, "modern": 36, "modif": [4, 16, 30], "modifi": [5, 35, 40, 47, 51, 62], "modul": [14, 17, 29], "modular": 10, "modulenotfounderror": 14, "monitor": 14, "monolith": 16, "more": [1, 4, 7, 11, 16, 18, 19, 21, 25, 32, 34, 35, 36, 37, 39, 40, 42, 45, 51, 52, 53, 58, 61], "most": [4, 18, 19, 28, 29, 32, 47, 56], "mount": [2, 3], "move": [18, 32, 51, 55, 60], "mozilla": 0, "mpi": [37, 38, 42], "mpirun": [55, 58, 60, 61], "mrpc": 16, "mt": 31, "much": [28, 32, 35, 52], "mul": 24, "multi": [28, 32, 33, 38, 39, 51, 60, 62], "multipl": [18, 20, 32, 36, 62], "multipli": 28, "must": [5, 15, 27, 28, 35], "mutex": 13, "mutual": 29, "my": [14, 18, 19], "mybuilddir": 39, "myfil": 7, "n": [18, 24, 25, 32, 33, 38, 39, 40, 51, 53], "n02123159": 48, "na": [27, 31], "name": [2, 3, 5, 7, 11, 14, 18, 19, 20, 25, 26, 28, 30, 32, 34, 35, 44, 49, 54, 58], "name_scop": 11, "namespac": [4, 17, 21, 23, 25, 26, 33, 40], "nan": 28, "narrow": 28, "nation": 0, "nativ": [4, 15, 16, 21], "natur": 0, "ncdhw": 24, "nchw": 32, "ncore_per_inst": 29, "ndhwc": 24, "necessari": [16, 28, 37, 41, 42, 53], "necessarili": 16, "need": [4, 8, 13, 14, 16, 17, 20, 21, 23, 28, 29, 30, 34, 35, 36, 37, 38, 39, 40, 42, 47, 52, 53, 56, 60, 61, 62], "neg": [32, 35], "neglig": 28, "neither": 29, "nest": 35, "netron": 18, "network": [14, 15, 32], "neural": [4, 14, 15, 21, 32, 44, 45, 52], "new": [4, 5, 7, 8, 15, 16, 21, 23, 24, 28, 30, 32, 36, 45, 51], "newer": [15, 45, 46, 52], "newrootscop": 40, "next": [4, 16, 28, 39, 49], "next_pluggable_devic": 30, "next_pluggable_device_factori": 30, "nextplugg": 30, "nextpluggabledevic": 16, "nhwc": [20, 32], "nibabel": 55, "nic": 31, "nice": 32, "nifti": 55, "nightli": 55, "ninstanc": 29, "nn": [11, 25, 26, 33, 35, 53], "nn_op": 11, "no_proxi": [2, 3], "no_python": 29, "node": [13, 18, 20, 24, 32, 36, 38, 45, 51], "node0": 32, "node1": 32, "node_id": 29, "nolint": 7, "nolintnextlin": 7, "non": [27, 35], "none": [8, 25, 26, 28, 29, 33, 51], "nonetyp": 56, "nonlinear": 25, "nor": 29, "norm": 25, "normal": [17, 20, 25, 28, 32, 39, 47], "note": [2, 3, 5, 11, 16, 17, 18, 20, 25, 27, 28, 29, 31, 33, 34, 36, 39, 40, 47, 49, 51, 54, 58, 60, 61], "notequ": 24, "notfounderror": [14, 47, 48, 51, 54, 55, 57, 60], "noth": 11, "notic": [13, 28], "novel": 16, "now": [2, 18, 28, 32, 34], "np": [22, 25, 53, 55, 58, 60, 61], "npd": [4, 27, 30], "npz": 28, "nth": 32, "nullptr": 11, "num": [29, 32, 51], "num_accumulation_steps_phase1": 51, "num_accumulation_steps_phase2": 51, "num_channel": 53, "num_class": 35, "num_el": 11, "num_gpu": [51, 62], "num_test": 34, "num_train_epoch": 57, "num_unit": [19, 28], "numa": 31, "numactl": [29, 35], "number": [15, 20, 24, 28, 31, 32, 35, 36, 44, 45, 51, 54, 61, 62], "number_of_process": 61, "numer": 28, "numpi": [22, 25, 28, 53, 55], "nv_result": 54, "nvidia": [28, 51, 54, 55, 60], "nvme": 31, "o": [2, 22, 27, 31, 35, 37, 38, 39, 40, 42, 44, 52], "oam": 31, "object": [12, 14, 18, 28, 32, 33, 47, 48, 49, 51, 54, 55, 56, 57, 60], "oblig": 0, "obvious": 18, "occasionali": 27, "occupi": 18, "occur": 28, "ocl": 11, "ocloc": [39, 40], "off": [13, 29, 31, 33, 52, 62, 63], "offcial": 11, "offens": 0, "offer": [19, 30, 32, 49], "offici": [0, 16, 32, 44, 45, 46, 51, 54, 55, 57, 60, 61, 62], "offlin": [0, 36, 39, 40], "offononoffoff": 33, "often": [29, 37, 41, 42], "ok": 51, "omp": [4, 20, 32, 35], "omp_num_thread": [29, 35], "omp_proc_bind": 32, "omp_schedul": 32, "onboard": 32, "onc": [20, 28, 32, 36], "onconfig": [18, 19], "one": [11, 15, 20, 21, 28, 32, 39, 40, 47, 53, 55, 61], "oneapi": [2, 14, 21, 31, 34, 38, 45, 47, 48, 51, 52, 54, 55, 56, 57, 60, 61, 62, 63], "oneapi_install_path": 34, "oneccl": [2, 37, 38, 42, 51], "onednn": [9, 11, 12, 14, 15, 20, 24, 32, 33, 36, 44], "onednn_cpu_git_vers": 33, "onednn_engin": 11, "onednn_gpu_git_vers": 33, "onednn_graph": 33, "onednn_graphoverrid": 33, "onednn_stream": 11, "onednn_verbos": 11, "onednngraph": 15, "onemkl": [37, 38, 39, 40, 42], "ones": [22, 25, 26, 33, 51], "onli": [2, 4, 5, 13, 14, 16, 17, 18, 20, 21, 23, 24, 28, 29, 30, 33, 34, 36, 37, 41, 51, 54, 55, 56, 57, 60, 61, 62], "onlin": [0, 31, 63], "op": [4, 9, 10, 16, 17, 20, 21, 23, 24, 26, 27, 28, 30, 35, 40, 49, 51, 54], "op_build": 11, "op_kernel": 11, "op_requires_ok": 11, "opaqu": 30, "open": [0, 5, 7, 14, 16, 18, 21, 34, 35, 37, 47, 48, 51, 52, 54, 55, 56, 57, 60, 63], "opencl": [14, 37, 39, 40, 42], "opencv": [49, 60], "openmp": [29, 39], "openvino": 49, "openxla": 4, "openxla_support_on_gpu": 21, "oper": [4, 13, 15, 16, 18, 23, 24, 28, 32, 35, 36, 63], "opinion": 0, "opkernel": 11, "opkernelconstruct": 11, "opkernelcontext": 11, "ops_overrid": 27, "opt": [2, 3, 11, 14, 37, 39, 40, 42, 46, 58], "optim": [2, 4, 9, 14, 15, 16, 17, 18, 23, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 42, 44, 45, 47, 49, 50, 51, 52, 54, 55, 60, 61, 63], "option": [2, 3, 7, 11, 18, 21, 29, 33, 35, 61, 62, 63], "order": [18, 19, 28, 29, 30, 32, 38, 43], "org": [0, 2, 7, 21, 39, 40, 49, 56], "organ": 16, "orient": 0, "origin": [4, 16, 18, 21, 23, 24, 25, 31, 36, 40, 45, 47, 49, 56], "orign": 31, "orthogon": [25, 26], "other": [0, 17, 20, 25, 28, 29, 30, 31, 32, 33, 34, 35, 37, 39, 40, 42, 56, 58, 63], "otherwis": [0, 17, 28, 33, 52, 53], "our": 29, "out": [3, 15, 28, 36, 40, 48, 51, 53, 54, 62], "outcom": 54, "outermost": 25, "output": [2, 7, 11, 13, 16, 19, 20, 24, 25, 28, 30, 31, 33, 35, 37, 39, 40, 47, 49, 52, 57], "output_dim": 35, "output_dir": [16, 55, 57, 60], "over": [18, 28, 49], "overal": [0, 32], "overhead": [13, 16, 28, 32, 35, 51], "overload": 26, "overrid": [4, 11, 18, 27, 28], "oversize_threshold": 29, "overview": 4, "own": [35, 49], "p": [2, 3, 25, 34, 41, 42, 47, 61], "pacakg": 56, "packag": [3, 27, 30, 32, 37, 38, 39, 41, 45, 51, 52, 55, 56, 60, 63], "pad": [24, 25, 53], "page": [5, 21, 22, 23, 32, 63], "paintbucket": 18, "parallel": [13, 20, 32, 35, 39], "paramet": [17, 26, 35, 47, 51], "parent": 9, "parsefromstr": 35, "part": [15, 16, 17, 32, 39, 40, 51, 60], "parti": [9, 36, 63], "particip": 0, "particular": 28, "particularli": 14, "partit": [15, 32], "pass": [11, 15, 16, 17, 28, 31, 33, 36, 49, 54, 62], "patch": [7, 34, 51, 54, 55, 57, 60, 62], "path": [2, 3, 7, 16, 18, 19, 20, 22, 29, 32, 33, 34, 37, 38, 39, 40, 42, 47, 49, 51, 52, 55, 57, 60, 61, 62], "path_to_itex": 3, "path_to_libitex_cpu_cc": 34, "path_to_libitex_gpu_cc": 34, "path_to_python_unit_test": 7, "path_to_site_packag": [37, 38, 42, 63], "path_to_tensorflow_serv": 3, "pattern": [0, 4, 15, 16, 21, 24], "pb": [18, 19, 34, 35, 47, 49], "pb_file": 35, "pbtxt": 17, "pci": [2, 30], "pcie": 31, "pdf": 25, "peak": [18, 23], "penal": 32, "peopl": 0, "per": [17, 28, 29, 31, 32, 38, 58, 62], "perf": 27, "perform": [4, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 28, 29, 32, 33, 35, 36, 39, 40, 44, 49, 51, 52, 54, 55, 60, 62, 63], "period": [0, 32], "permiss": [0, 5], "person": 0, "perspect": [29, 32], "phase": [15, 31, 36, 51], "phase1": [31, 51], "phase2": 51, "phase_2": 51, "photo": 52, "physic": [0, 30, 32, 62], "physical_devic": [14, 58], "physical_device_desc": 2, "physicaldevic": [14, 58], "pick": 7, "picker": 5, "piecewiseconstantdecai": 25, "pip": [7, 11, 14, 22, 27, 33, 34, 37, 38, 39, 40, 41, 42, 45, 46, 49, 51, 54, 55, 58, 60, 62, 63], "pip3": 41, "pip_packag": [11, 39], "pip_set_env": [51, 52, 54, 55, 57, 60, 61], "pipelin": [16, 44, 45, 52], "pjrt": [4, 16, 21, 63], "place": [4, 17, 21, 32, 40], "placement": [29, 32], "plai": 32, "plain": 36, "platform": [14, 16, 28, 32, 33, 37, 39, 40, 41, 51, 54, 55, 56, 57, 60, 61, 62], "platinum": [31, 32, 35], "pleas": [7, 11, 14, 16, 17, 21, 27, 28, 37, 39, 40, 42, 44, 45, 47, 51, 53, 55, 57, 58, 60, 61, 63], "plu": [16, 32], "plug": [34, 63], "pluggabl": [4, 10, 16, 30, 40], "pluggable_devic": 30, "pluggable_device_factori": 30, "pluggabledevic": [10, 27, 63], "plugin": [4, 10, 16, 18, 19, 21, 22, 34, 39, 58, 63], "po": 35, "point": [17, 18, 20, 28, 33, 37, 42, 47], "polici": [29, 32, 63], "polit": 0, "polymorph": 11, "pool": 4, "popular": [15, 16, 31], "port": [34, 54], "portabl": [16, 36], "posit": [0, 7], "possibl": [4, 19, 32, 35, 36, 39], "post": [0, 7, 18, 19, 24, 33], "post1": 40, "potenti": [28, 63], "power": [19, 63], "ppn": [55, 58, 60, 61], "pr": 5, "practic": [4, 28, 29], "pramet": 62, "pre": [18, 31, 33, 41, 42, 51, 56], "precis": [4, 16, 30, 31, 33, 44, 45, 49, 54, 57], "preconfigur": 39, "predict": [19, 26, 27, 28, 35, 57], "predict_batch_s": 16, "predict_fil": 57, "prefer": [29, 37, 41, 42], "prefix": 29, "preload": 32, "preop": 18, "prepack": 4, "prepend": [29, 55, 58, 60, 61], "preprocess": 60, "preprocess_data": 55, "present": [30, 54], "preserv": 20, "press": 38, "pretrain": [31, 44, 49], "pretrain_bert": 51, "pretrain_lamb": 51, "pretrain_path": 51, "pretrain_result_dir": 51, "prevent": 28, "previou": [8, 25, 32, 51], "previous": [28, 30], "primari": [17, 32], "primit": [11, 13, 20, 36], "primitive_attr": 11, "primitive_desc": 11, "principl": 18, "print": [2, 11, 19, 22, 25, 28, 29, 30, 33, 35, 37, 38, 39, 40, 41, 42, 47, 48, 51, 53, 54, 62, 63], "print_graph": 35, "printf": 51, "priorit": 18, "prioriti": [20, 33], "privaci": 0, "privat": 0, "privileg": [2, 3, 47], "problem": [14, 24, 28, 32, 56], "proc": [28, 32], "procedur": [11, 37, 41, 42], "process": [4, 7, 11, 16, 21, 28, 29, 32, 34, 51, 52], "process_per_nod": 61, "processor": [4, 21, 31, 32, 41, 47, 52, 53], "proclist": 32, "produc": 57, "product": [5, 7, 21, 34, 37], "profession": 0, "profil": [4, 9, 28, 30, 32], "profiler_demo": 22, "program": [9, 27, 32, 63], "project": [2, 5, 7, 16, 63], "prolong": [39, 40], "promot": 7, "prompt": [31, 39, 40], "promptli": 0, "prop_kind": 11, "propag": [9, 13, 16, 17], "properli": [21, 29], "properti": [17, 18, 28], "propos": [7, 25], "protect": 11, "protobuf": 52, "protocol": 49, "protocolmessag": 33, "provid": [0, 2, 4, 7, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 42, 44, 45, 49, 51, 52, 55, 60, 61, 62, 63], "proxi": 36, "prune": 35, "pseudocod": 28, "pub": 37, "public": [0, 4, 5, 11, 21, 25, 33, 34], "publish": [0, 5], "pull": [7, 34, 41, 42, 47], "pure": 31, "push": [5, 16], "put": 34, "pvc": [39, 40, 51], "pwd": [47, 62], "py": [7, 11, 16, 22, 29, 34, 35, 42, 47, 48, 49, 51, 54, 55, 56, 57, 58, 60, 61, 62], "pybind11": 60, "pycocotool": 60, "pylint": 7, "pylintrc": 7, "pypi": [2, 43, 63], "python": [2, 4, 9, 14, 19, 22, 23, 25, 26, 27, 28, 29, 30, 32, 34, 35, 37, 38, 39, 41, 42, 45, 46, 49, 51, 52, 53, 55, 56, 57, 58, 60, 61, 63], "python3": [2, 5, 16, 38, 39, 54, 56], "pythonhost": 40, "pythonpath": 61, "pytorch": [27, 30], "q1": 14, "q_model": 49, "qdq": 52, "qo": 37, "qualiti": 28, "quantiz": [4, 44], "quantizev2": 49, "queri": 28, "question": [0, 4, 36, 63], "queue": [35, 62], "quick": [4, 11, 37, 44], "quickli": [20, 28], "r": [3, 7, 14, 28, 31, 32, 44, 62], "r2": [34, 40, 62], "race": 0, "rais": 33, "rand": 53, "random": [25, 35, 53], "randomnorm": 40, "rang": [25, 28, 32, 35], "rank": [31, 55, 58, 60, 61], "rapid": [41, 47], "rare": 28, "rate": [14, 15, 18, 25, 34], "rather": 25, "ratio": 36, "raw": 58, "rb": 35, "rcfile": 7, "rcnn": 49, "re": [2, 32, 35, 46], "reach": 18, "read": [20, 28, 35, 45, 55], "readm": 61, "real": [15, 28, 36, 51, 61], "reason": [0, 28, 30], "recent": 56, "recogn": [44, 45], "recommend": [16, 20, 28, 32, 33, 34, 35, 37, 38, 39, 41, 42, 46, 52], "record": [36, 61], "recurrent_activ": [25, 26], "recurrent_initi": [25, 26], "recurs": 7, "red": 42, "reduc": [15, 16, 18, 28, 32, 36, 39, 40, 45, 51, 54, 62], "reduce_mean": 35, "ref_result_dir": 54, "refer": [2, 3, 7, 11, 14, 15, 17, 18, 19, 20, 21, 23, 28, 31, 32, 33, 34, 37, 39, 40, 42, 44, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "refresh": 22, "regardless": 0, "region": 32, "regist": [4, 14, 30, 45, 52], "register_": 11, "register_geluop": 11, "register_kernel_build": 11, "registr": [10, 11, 55], "registrationcent": [37, 42], "regress": 27, "regular": [25, 36], "reinstal": 51, "reject": 0, "rel": [16, 29, 51], "relat": [5, 27, 29, 34, 36], "relationship": [14, 18], "releas": [4, 14, 17, 32, 33, 34, 39, 40, 45, 54, 56], "reli": 17, "relianc": 16, "religion": 0, "relu": [4, 11, 19, 21, 24, 25, 26, 28, 35, 53], "relu6": 24, "relu_op": 11, "relu_op_functor": 11, "relubaseop": 11, "relugrad": 24, "remain": [20, 30], "remapp": [19, 24, 33], "remot": 32, "remov": [0, 11, 16, 18, 24], "reorder": [13, 36], "repeat": 18, "replac": [14, 25, 26, 27, 34, 36, 40, 51], "replica": [11, 20], "repo": [5, 31, 37, 38], "report": [0, 7, 20, 63], "repositori": [9, 16, 31, 37, 51, 55, 60], "repres": [0, 4, 16, 17, 30, 31], "represent": 15, "representative_dataset": 49, "reproduc": 31, "request": [0, 7, 63], "requir": [2, 4, 7, 11, 13, 15, 16, 21, 22, 24, 25, 28, 29, 30, 36, 38, 45], "rerun": 28, "research": 57, "reserv": 32, "reset": 54, "reshap": [19, 25, 28, 35], "resnet": [61, 62], "resnet101": 49, "resnet34": 49, "resnet50": [17, 29, 31, 44, 49, 59], "resnet50_itex": 62, "resnet_ctl_imagenet_main": 62, "resnet_v1_50": 22, "resolv": 1, "resourc": [29, 32, 56], "respect": [0, 29, 35, 51], "rest": [20, 24], "rest_api_port": 34, "restart": 38, "result": [5, 15, 16, 17, 19, 22, 27, 28, 30, 32, 33, 38, 45, 48, 53, 54, 56, 62], "result_dir": 51, "retinanet50": 49, "retrain": 28, "retriev": [28, 49], "return": [11, 17, 28, 30, 33, 35, 40], "return_sequ": 25, "return_st": 25, "reus": [32, 45], "review": 0, "rewrit": [11, 17], "rewrite_opt": 52, "rewriter_config_pb2": 52, "rewriterconfig": 52, "rewritten": 16, "rf": [34, 46, 61], "rfc": [7, 21], "right": [0, 25], "rm": [34, 40, 46, 47, 61], "rmsprop": [19, 28, 35], "role": 32, "root": [7, 39, 40, 56], "rpath": 40, "rule": 19, "run": [7, 11, 14, 16, 18, 19, 22, 24, 26, 27, 28, 29, 31, 32, 33, 35, 39, 41, 42, 63], "run_20210712212258_inst": 29, "run_20210712212258_instance_0_cores_0": 29, "run_20221009103552_inst": 29, "run_20221009103552_instance_0_cores_0": 29, "run_20221009104740_inst": 29, "run_20221009104740_instance_0_cores_0": 29, "run_20221009105044_inst": 29, "run_20221009105044_instance_0_cores_12": 29, "run_20221009105320_inst": 29, "run_20221009105320_instance_0_cores_0": 29, "run_20221009105838_inst": 29, "run_20221009105838_instance_0_cores_0": 29, "run_20221009105838_instance_1_cores_12": 29, "run_20221009105838_instance_2_cores_24": 29, "run_20221009105838_instance_3_cores_36": 29, "run_20221009105838_instance_4_cores_48": 29, "run_20221009105838_instance_5_cores_60": 29, "run_20221009105838_instance_6_cores_72": 29, "run_20221009105838_instance_7_cores_84": 29, "run_20221009110327_inst": 29, "run_20221009110327_instance_0_cores_0": 29, "run_20221009110327_instance_10_cores_40": 29, "run_20221009110327_instance_11_cores_44": 29, "run_20221009110327_instance_12_cores_48": 29, "run_20221009110327_instance_13_cores_52": 29, "run_20221009110327_instance_14_cores_56": 29, "run_20221009110327_instance_15_cores_60": 29, "run_20221009110327_instance_16_cores_64": 29, "run_20221009110327_instance_17_cores_68": 29, "run_20221009110327_instance_18_cores_72": 29, "run_20221009110327_instance_19_cores_76": 29, "run_20221009110327_instance_1_cores_4": 29, "run_20221009110327_instance_20_cores_80": 29, "run_20221009110327_instance_21_cores_84": 29, "run_20221009110327_instance_22_cores_88": 29, "run_20221009110327_instance_23_cores_92": 29, "run_20221009110327_instance_2_cores_8": 29, "run_20221009110327_instance_3_cores_12": 29, "run_20221009110327_instance_4_cores_16": 29, "run_20221009110327_instance_5_cores_20": 29, "run_20221009110327_instance_6_cores_24": 29, "run_20221009110327_instance_7_cores_28": 29, "run_20221009110327_instance_8_cores_32": 29, "run_20221009110327_instance_9_cores_36": 29, "run_20221009110849_inst": 29, "run_20221009110849_instance_0_cores_0": 29, "run_20221009110849_instance_1_cores_11": 29, "run_20221009110849_instance_1_cores_24": 29, "run_20221009110849_instance_2_cores_22": 29, "run_20221009110849_instance_2_cores_48": 29, "run_20221009110849_instance_3_cores_33": 29, "run_20221009110849_instance_3_cores_72": 29, "run_20221009111034_instance_0_cores_0": 29, "run_20221009111239_instance_0_cores_24": 29, "run_20221009111753_inst": 29, "run_20221009111753_instance_0_cores_0": 29, "run_20221009111951_inst": 29, "run_20221009111951_instance_0_cores_0": 29, "run_20221009112720_instance_0_cores_0": 29, "run_20221009112905_instance_0_cores_0": 29, "run_20221009112956_instance_0_cores_0": 29, "run_classifi": 16, "run_inf": 35, "run_jupyt": 52, "run_pretraining_lamb": 51, "run_squad": [51, 57], "runner": 61, "runtim": [16, 18, 23, 25, 27, 28, 32, 36, 37, 39, 40, 51, 63], "safe": [13, 18, 33, 63], "sai": [28, 51], "same": [5, 7, 14, 20, 21, 23, 24, 25, 28, 29, 30, 31, 32, 33, 34, 35, 36, 39, 40, 45, 53], "sampl": [2, 22, 31, 35, 45, 52, 54], "samsung": 31, "saniti": [7, 63], "sapphir": [41, 47], "satisfi": [13, 23], "save": [5, 11, 17, 29, 33, 49, 57], "save_checkpoint_step": 51, "save_json_data": 35, "saved_model": 34, "savedmodel": 49, "scalabl": [4, 21, 31, 34, 41, 47], "scale": [4, 25, 26, 31, 35, 62], "scaled_gradi": 28, "scaled_loss": 28, "scenario": [4, 13, 20, 21, 23, 32, 33], "schedul": [13, 16, 25, 29, 32, 35], "schmidhub": 25, "scope": [17, 40], "scratch": [28, 51], "scratchpad": [11, 13], "scratchpad_mem": 11, "scratchpad_mod": 11, "screen": 47, "script": [5, 21, 22, 27, 32, 39, 40, 42, 47, 49, 51, 53, 55, 56, 60, 61], "sdp": 29, "seamless": [4, 30], "search": [7, 29], "sec": [31, 35, 51, 62], "second": [32, 35, 52, 61, 62], "section": [14, 28, 32, 37, 39, 40, 49], "secur": 0, "see": [0, 1, 2, 4, 7, 14, 16, 22, 25, 28, 29, 32, 34, 36, 37, 39, 52, 61, 63], "seed": 60, "seen": 32, "segment": [31, 44, 60], "select": [14, 28, 29, 30, 33, 54, 63], "self": 35, "semant": [17, 20, 25], "send": 16, "separ": [11, 14, 23, 24, 28, 31, 32, 38, 39, 63], "seq": 16, "sequenc": [31, 51, 54], "sequenti": 35, "seri": [0, 16, 32, 33, 39, 40, 42, 45, 47, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "serial": 35, "seriesintel": 47, "seriesne": 47, "seriessupport": 47, "seriou": 0, "serv": [4, 30], "serval": 27, "server": [5, 31, 39, 40, 42], "servic": 55, "serving_plugin": 34, "session": [40, 52], "set": [0, 2, 4, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 27, 31, 32, 33, 35, 37, 38, 40, 42, 47, 51, 52, 57, 63], "set_config": [17, 18, 19, 47, 62], "set_env_cpu": [47, 48, 56], "set_env_gpu": [47, 48, 56], "set_global_polici": 28, "set_log_device_plac": 22, "set_scratchpad_mod": 11, "set_sess": 52, "set_weight": 28, "setup": [38, 41, 43, 45], "setvar": [14, 37, 42, 46, 58], "sever": [4, 16, 21, 29, 31, 32, 39, 40, 44, 61], "sex": 0, "sexual": 0, "sh": [2, 3, 5, 14, 34, 37, 38, 39, 40, 42, 46, 47, 48, 51, 52, 54, 55, 56, 57, 58, 60, 61, 63], "shape": [11, 13, 16, 17, 19, 25, 28, 30, 35, 36, 53], "shard": [4, 17, 21, 33], "sharding_config": [17, 62], "shardingconfig": [17, 62], "share": [7, 14, 32, 37, 47, 48, 51, 54, 55, 57, 60], "short": [16, 25, 28], "shoul": 40, "should": [2, 3, 5, 7, 22, 27, 28, 32, 34, 35, 37, 38, 40, 41, 42, 45, 51, 57, 62], "show": [5, 14, 16, 18, 27, 28, 31, 35, 39, 40, 42, 44, 45, 47, 49, 50, 51, 52, 54, 55, 56, 57, 60, 61, 62], "showcas": [16, 31], "shown": [2, 3, 15, 22, 24, 29, 51, 54, 55, 60], "shuffl": 28, "sigmoid": [24, 25, 26], "sign": [25, 37], "signific": [4, 7, 18], "significantli": [4, 28], "signoff": 51, "similar": [19, 32], "simpl": [4, 21, 23, 28, 40], "simpli": [28, 30, 62], "simplifi": 45, "simultan": [31, 42], "sinc": [4, 14, 28, 32, 36, 42], "singl": [0, 4, 7, 15, 20, 21, 24, 31, 51, 60, 61], "single_l2_loss_op": 62, "site": [5, 8, 37, 38, 39, 42, 56, 63], "situat": [20, 33], "size": [0, 20, 25, 28, 29, 31, 51, 58, 62], "skip": [7, 28, 29, 38], "skip_cross_node_cor": 29, "skip_ev": 62, "sle": 42, "sleep": 32, "slowdown": 16, "slower": [18, 19, 28, 35], "slowli": 28, "small": [13, 25, 28, 29, 32, 35], "sn850x": 31, "snapshot": 39, "snippet": 61, "so": [14, 16, 19, 28, 29, 32, 33, 34, 39, 40, 47, 48, 51, 54, 55, 56, 57, 58, 60], "social": 0, "socio": 0, "socket": [31, 32, 38, 62], "softmax": [18, 19, 28], "softwar": [2, 16, 38, 43, 45, 52, 53, 58], "sole": 32, "solut": [4, 14, 15, 21, 27, 30], "solv": [28, 56], "some": [2, 11, 18, 19, 26, 28, 29, 32, 39, 40, 49, 51, 58], "sometim": 7, "sort": [0, 16], "sourc": [2, 3, 4, 7, 11, 16, 17, 21, 37, 38, 42, 43, 46, 47, 48, 52, 55, 56, 58, 60, 63], "sp4": [31, 42], "sp5": 42, "space": [0, 32, 63], "sparse_categorical_crossentropi": [19, 28], "sparsecategoricalaccuraci": [28, 35], "sparsecategoricalcrossentropi": [28, 35], "special": [16, 19, 23, 28, 39, 40], "specif": [4, 16, 28, 30, 32, 33, 34, 37, 42, 61, 63], "specifi": [0, 3, 11, 21, 24, 28, 29, 32, 34, 39, 40, 49], "sped": 28, "speed": [15, 16, 18, 32, 44, 45], "speedup": [16, 31, 52, 62], "spend": 28, "split": [17, 18, 35], "squad": [31, 51, 57], "squad_dir": 57, "squad_vers": 51, "src": [7, 11, 14, 17, 34, 39], "src_mem": 11, "src_tensor": 11, "ssd": [31, 49], "ssdsc2kg960g8": 31, "st": [3, 40], "stabil": [19, 28], "stabl": [25, 28, 44, 63], "stable_diffusion_accuraci": 54, "stable_diffusion_infer": 54, "stable_diffussion_infer": 54, "stablehlo": 16, "stack": [31, 42, 43], "stage": [16, 52], "stage_num": [17, 62], "stall": 32, "standard": [7, 25], "standard_op": 40, "start": [2, 3, 14, 21, 22, 28, 29, 34, 35, 63], "startup": [39, 40], "stat": 22, "static": 32, "statist": 49, "statu": [0, 11, 19, 40], "status_msg": 40, "statusuniqueptr": 11, "std": [11, 40], "stdout": [7, 29], "steal": 35, "step": [3, 16, 17, 18, 25, 28, 31, 32, 34, 36, 44, 45, 51, 55, 58, 60, 62], "steps_per_epoch": [35, 60], "steps_per_loop": 62, "still": 28, "stock": [14, 16, 23, 24, 28, 30, 37, 38, 41, 42, 45, 49, 51, 54, 55, 56, 57, 60, 61, 62, 63], "stop": [22, 32], "storag": [16, 28, 31, 35, 47, 49, 56], "store": 36, "strategi": 32, "stream": [13, 27, 54, 62], "stream_executor": 28, "streamexecutor": [10, 30], "streamlin": [4, 21, 34], "strictli": 25, "stride": 53, "string": [18, 28, 29, 39, 40], "stringop": 34, "strong": 18, "structur": [4, 19, 29, 32], "sub": [9, 14, 18, 19, 32, 33], "subgraph": [15, 16], "submit": [5, 7, 63], "subsequ": [18, 19, 28, 32, 54], "subystem": 37, "succe": 36, "success": [48, 53, 54, 62], "successfulli": [14, 34, 38, 39, 40, 42, 62], "sudo": [7, 34, 37, 39, 40, 42], "suffici": [28, 35], "suggest": [56, 62], "sum": 35, "summari": [51, 63], "super": 35, "suppli": 35, "support": [4, 7, 13, 14, 15, 16, 17, 18, 19, 22, 24, 27, 28, 29, 30, 32, 33, 37, 39, 40, 41, 42, 45, 47, 52, 61, 62], "suppos": [32, 51], "sure": [3, 11, 28, 35, 37, 39, 40], "suse": [31, 42], "sustain": 0, "sw": 37, "swish": [19, 24], "switch": [4, 5, 27, 32, 35, 39], "sy": 53, "sycl": 14, "sycl_runtim": [14, 28], "symbol": 40, "sync": 33, "system": [14, 21, 30, 31, 32, 34, 35, 38, 39, 40, 56], "t": [2, 5, 11, 13, 17, 18, 20, 28, 29, 31, 36, 49, 54, 56], "tab": 22, "tabl": [18, 28, 29, 30, 31, 49], "tag": 5, "take": [0, 11, 16, 24, 28, 29, 32, 34, 35, 38, 51], "tanh": [24, 25, 26], "tape": 28, "tar": [3, 7, 32, 49], "target": [3, 16, 17, 39, 40], "task": [11, 20, 32, 61], "task_nam": 16, "taskset": 29, "tbb": 42, "tdp": 31, "team": [7, 54], "techniqu": [15, 28], "technologi": [16, 45], "tee": [29, 37, 51, 62], "tell": 14, "templat": 11, "temporari": 13, "tensor": [11, 16, 25, 28, 30, 40, 53], "tensorboard": [22, 63], "tensorflow": [5, 8, 9, 10, 11, 13, 14, 15, 16, 17, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 38, 43, 44, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "tensorflow2": [51, 58, 60], "tensorflow2_keras_mnist": 58, "tensorflow_doc": 56, "tensorflow_hub": 22, "tensorflow_model_serv": [3, 34], "tensorflow_plugin": 34, "tensorflow_serv": [3, 34], "tensorflow_src": 40, "term": [0, 25, 30, 63], "termin": 38, "test": [9, 19, 22, 28, 34, 35, 38, 44, 55, 56], "test_accuraci": 28, "test_dataset": 28, "test_func": 28, "test_scor": [19, 28], "test_step": 28, "text": [18, 31, 44], "text2imag": [31, 44], "tf": [11, 14, 15, 19, 22, 25, 26, 27, 28, 29, 30, 33, 35, 37, 39, 40, 41, 42, 51, 52, 53, 62], "tf2": [49, 51, 56], "tf32": [20, 31, 51], "tf_auto_jit_flag": 27, "tf_auto_mixed_precision_graph_rewrite_allowlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_allowlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_clearlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_clearlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_denylist_add": 18, "tf_auto_mixed_precision_graph_rewrite_denylist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_inferlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_inferlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_level": 18, "tf_auto_mixed_precision_graph_rewrite_log_path": 18, "tf_bert_finetune_": 51, "tf_bert_pretraining_lamb_": 51, "tf_check_ok": 40, "tf_code": 40, "tf_compatible_vers": 33, "tf_copt": [11, 34], "tf_cpp_max_vlog_level": 20, "tf_cpp_min_log_level": 20, "tf_cuda_librari": 34, "tf_enable_onednn_opt": 29, "tf_getcod": [11, 40], "tf_hub": 22, "tf_include_path": 40, "tf_kera": 27, "tf_loadpluggabledevicelibrari": 40, "tf_messag": 40, "tf_newopdefinitionbuild": 11, "tf_newstatu": [11, 40], "tf_num_interop_thread": 62, "tf_num_intraop_thread": 62, "tf_ok": [11, 40], "tf_opdefinitionbuild": 11, "tf_opdefinitionbuilderaddattr": 11, "tf_opdefinitionbuilderaddinput": 11, "tf_opdefinitionbuilderaddoutput": 11, "tf_opdefinitionbuildersetshapeinferencefunct": 11, "tf_registeropdefinit": 11, "tf_serv": 34, "tf_statu": 40, "tf_use_legacy_kera": [27, 51, 54], "tf_ver": 2, "tf_xla_auto_jit": [16, 27, 30], "tf_xla_flag": [16, 27, 30], "tf_xla_use_device_api": [16, 30], "tfa": [25, 26, 55], "tfcc_path": 40, "tfd": 61, "tfg": 17, "tfg_optimizer_hook": 62, "tfg_to_h": 17, "tfhub": 22, "tfrecord": [51, 55, 61], "tfx": 21, "than": [19, 25, 28, 32, 35, 37, 42, 47, 53, 58], "thei": [0, 18, 28, 29, 32], "them": [16, 18, 21, 28, 29, 32, 34, 56, 61], "therefor": [28, 32], "thereof": 16, "thi": [0, 2, 3, 4, 5, 11, 13, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 45, 46, 49, 50, 51, 52, 53, 55, 57, 60, 62, 63], "thing": 21, "think": 28, "third": [9, 36, 63], "third_parti": [7, 9, 34], "those": [0, 16, 18, 19, 34, 61], "though": 39, "thrash": 32, "thread": [4, 13, 20, 29, 31, 32, 33, 42], "threadpool": [3, 20, 40], "threaten": 0, "three": [4, 21, 22, 23, 29], "through": [0, 27, 28, 32, 35, 39, 40, 55, 63], "throughput": [31, 47, 51, 54], "throughput_mod": 29, "throughput_train": 51, "thu": 32, "tiger_cat": 48, "tightli": 30, "tile": [17, 20, 33, 51, 58, 60, 61, 62], "time": [0, 4, 11, 14, 16, 18, 19, 20, 21, 22, 28, 31, 32, 35, 39, 40, 45, 49, 51], "timehistori": [61, 62], "tip": [11, 20, 32, 34], "tmp": 34, "todai": 30, "togeth": 32, "toggl": 33, "toi": 28, "token": [54, 56], "too": [18, 28, 37, 42], "tookit": [39, 40], "tool": [7, 9, 11, 14, 18, 32, 36, 37, 38, 39, 40, 42, 63], "toolchain": 39, "toolkit": [14, 31, 37, 38, 45, 47, 58, 63], "top": 27, "topic": 4, "topologi": [21, 29, 32], "total": [31, 32, 35, 49, 51, 58], "total_loss": 51, "total_tim": 35, "total_training_step": 51, "tour": 63, "tout": 24, "toward": 0, "tpl": 7, "tpost": 24, "tpu": 49, "trace": 22, "traceback": 56, "track": [22, 56], "train": [2, 14, 17, 18, 21, 24, 25, 26, 27, 29, 34, 35, 37, 38, 42, 43, 44, 47, 51, 52, 57, 59, 63], "train_accuraci": 62, "train_and_ev": 61, "train_batch_s": [57, 60], "train_batch_size_phase1": 51, "train_batch_size_phase2": 51, "train_dataset": 28, "train_epoch": 62, "train_fil": 57, "train_horovod": 58, "train_loss": [51, 62], "train_maskrcnn": [55, 60], "train_step": [28, 51, 62], "trainabl": [25, 35], "trainable_vari": 28, "trainer": 61, "trainingop": 24, "transfer": 52, "transform": [24, 25], "translat": [0, 39, 40], "transpar": [4, 21], "transpos": [24, 26], "travers": 36, "treat": 20, "tree": [39, 40], "tri": 56, "tricki": 28, "trigger": [5, 19, 33], "troll": 0, "true": [11, 16, 22, 25, 26, 28, 29, 30, 33, 35, 40, 51, 57, 62], "truncat": 34, "try": [11, 21, 29, 45, 49, 52], "ttt": 31, "tumor": 55, "tune": [31, 33, 45, 51], "tupl": 35, "turbo": 31, "turn": [17, 63], "tutori": 56, "two": [4, 13, 14, 19, 21, 23, 28, 32, 35, 39, 47, 51, 54, 55, 60], "txt": [16, 18, 37, 42, 54, 57, 62], "type": [4, 7, 11, 14, 18, 20, 21, 29, 31, 33, 38, 39, 40, 47, 49], "type_infer": 17, "typeconstraint": 11, "typeerror": 56, "typenam": 11, "typic": [4, 21, 23, 28, 32], "u": [0, 22, 29, 42], "ubuntu": [2, 31, 34, 39, 40, 41, 42], "ubuntu22": 56, "ubuntu_vers": 2, "uma": 32, "unaccept": 0, "uncased_l": 51, "unchanged_shape_fn": 11, "undef": 11, "undefin": [2, 30], "under": [17, 23, 26, 29, 33, 39, 52], "understand": 36, "undesir": 29, "unet": [31, 44], "unet_3d_med": 55, "unexpect": 51, "unifi": [21, 29, 37], "uniform": [4, 16, 21, 30, 35], "uniniti": 17, "uninstal": [11, 51, 60], "unit": [19, 25, 28, 32, 35], "unknown": [14, 28], "unkown": 27, "unless": 33, "unmodifi": 16, "unnecessari": [24, 28, 32], "unoptim": 36, "unordered_map": 11, "unprofession": 0, "unsafe_force_al": 18, "unscal": 28, "unshard": 17, "unsolicit": 0, "unspecifi": 29, "until": [18, 32], "unwelcom": 0, "unzip": 40, "up": [18, 22, 28, 32, 37, 40, 44, 51, 54, 57], "updat": [2, 18, 27, 28, 37, 38, 39, 40, 41, 42, 62], "update_st": 28, "upenn": 55, "upgrad": [14, 37, 38, 41, 42, 45, 46, 49, 55, 60, 63], "upon": 55, "upstream": [14, 18], "url": [49, 54, 56], "us": [0, 2, 3, 4, 5, 7, 13, 14, 15, 16, 18, 19, 20, 22, 23, 24, 25, 26, 28, 31, 32, 33, 36, 37, 38, 39, 40, 42, 44, 46, 47, 49, 50, 51, 52, 53, 55, 56, 57, 60, 63], "usag": [4, 14, 16, 21, 32, 33, 35, 44], "use_bia": [25, 26], "use_default_alloc": 29, "use_itex_shard": 62, "use_logical_cor": 29, "use_mytrain": 51, "use_synthetic_data": [60, 62], "use_tf_funct": 62, "use_tf_while_loop": 62, "use_tpu": 57, "use_xla": 51, "usecyclespersecondtim": [4, 21, 22, 28], "user": [4, 5, 7, 11, 13, 19, 20, 21, 23, 27, 30, 37, 39, 40, 41, 42, 43, 47, 54, 63], "usr": [7, 29, 37, 39], "usual": 18, "ut": 7, "util": [4, 9, 11, 14, 16, 21, 23, 29, 31, 32, 35, 56, 62], "v": [2, 3, 16, 18, 34, 38, 40, 42, 46, 47], "v0": [31, 33, 38], "v1": [35, 49, 51, 52, 57, 63], "v100": 51, "v1_8": [35, 47], "v2": [15, 31, 33, 38, 42, 49, 51, 61, 63], "v3": [15, 44], "v4": [18, 35, 44], "val_accuraci": 28, "val_loss": 28, "valid": [8, 33], "validation_split": [19, 28, 35], "valu": [15, 17, 18, 20, 25, 28, 29, 31, 32, 33, 61], "valueerror": 33, "var": [2, 14, 34, 38, 39, 40, 42], "vari": 27, "variabl": [2, 4, 13, 15, 16, 19, 21, 22, 23, 24, 25, 27, 28, 30, 32, 34, 35, 38, 40, 52], "variable_dtyp": 28, "varianc": 25, "varibl": 51, "varieti": 44, "variou": 16, "ve": [39, 40], "vector": 40, "venv": [46, 55, 58, 60], "verbos": [11, 19, 20, 28, 29, 30, 35], "veri": [15, 28, 51], "verifi": [38, 39, 40, 44, 51, 54, 55, 56, 57, 60, 61, 62], "version": [0, 2, 11, 14, 16, 27, 28, 31, 32, 37, 38, 39, 40, 41, 42, 45, 46, 51, 56], "versu": [19, 32], "via": [0, 4, 11, 17, 27, 30, 31, 35, 44, 62, 63], "view": 8, "viewer": 22, "viewpoint": 0, "violat": 0, "virtual": [39, 40, 51, 52, 54, 55, 56, 57, 60, 61, 62], "virtual_env": 29, "visibl": [0, 2, 11, 34], "vision": 30, "visit": 63, "vnni": 52, "vocab": [16, 57], "vocab_fil": [16, 57], "void": 11, "volum": 55, "vulner": 63, "vz": 40, "w": [28, 31, 35, 44], "wa": [0, 29, 32, 33, 39, 40], "wai": [0, 16, 19, 28, 30, 34, 36, 38], "wait": 32, "want": [3, 5, 7, 28, 29, 37, 39, 40, 42, 51, 54, 57, 60], "warm": [22, 35], "warmup": 35, "warmup_step": 55, "warmup_steps_phase1": 51, "warmup_steps_phase2": 51, "warn": [28, 29, 40, 51], "wd": [25, 31], "wd_black": 31, "we": [0, 2, 7, 11, 24, 27, 28, 31, 32, 33, 34, 35, 38, 39, 40, 45, 46, 47, 49, 51, 52, 54, 55, 56, 57, 60, 61, 63], "weak": 31, "web": [5, 56], "websit": [45, 63], "weight": [4, 13, 25, 28, 51, 53, 62], "weight_decai": [25, 26], "welcom": [0, 7, 63], "well": [0, 2, 8, 11, 21, 26, 28, 29, 30, 31, 32, 51], "were": [0, 16, 29, 32], "wether": 27, "wget": [2, 7, 32, 35, 37, 39, 40, 42, 47, 49, 56, 58], "what": [0, 14, 28], "wheel": [2, 38, 39], "when": [0, 5, 14, 17, 19, 24, 27, 28, 29, 32, 34, 35, 36, 37, 39, 40, 51, 52, 55, 56, 60], "where": [25, 28, 31, 32, 39, 49], "wherea": 61, "wherebi": 32, "whether": [24, 29, 32], "which": [0, 4, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 24, 28, 29, 30, 32, 33, 35, 36, 37, 39, 40, 42, 45, 46, 52, 57], "while": [16, 21, 28, 31, 32, 33, 34, 39, 48, 53, 56], "whitespac": 51, "whitlei": 31, "whl": [2, 11, 39, 40, 63], "whole": [18, 20, 33, 51], "whole_seq_output": 25, "whose": 18, "why": 0, "wide": [14, 25, 36, 44], "wiki": 0, "wiki_onli": 51, "wikicorpus_en": 51, "wikipedia": [31, 32, 51], "wish": 39, "within": [0, 15, 25, 30, 37, 51], "without": [0, 4, 16, 18, 20, 21, 23, 28, 30, 31, 39, 40, 44, 52, 56, 63], "withsum": 24, "wl": 40, "wno": 34, "won": [5, 29, 36], "work": [1, 4, 7, 14, 15, 19, 20, 21, 27, 28, 29, 32, 35, 36, 40, 42, 45, 49, 52], "worker": 28, "workflow": 16, "workload": [2, 4, 16, 32, 35, 44, 52, 60, 63], "workspac": [2, 3, 34], "world": 28, "wors": 47, "would": [28, 37, 39, 61], "wrap": 28, "wrap_funct": 35, "wrapper": [28, 42], "write": [5, 7, 16, 19], "written": [0, 7, 27], "wrong": [39, 40], "ws1": 47, "wu": 25, "www": [0, 21, 42], "x": [11, 19, 25, 26, 28, 31, 39, 40, 47, 53, 58], "x15": 14, "x710": 31, "x86_64": [38, 39, 40], "x_test": [19, 28, 35], "x_train": [19, 28, 35], "xe": 31, "xeon": [4, 21, 31, 32, 35, 39, 40, 41, 44, 47], "xfd": 11, "xla": [4, 16, 27], "xla_global_id": 2, "xpu": [2, 4, 11, 14, 17, 19, 22, 25, 26, 28, 30, 33, 37, 38, 43, 45, 46, 47, 48, 49, 53, 54, 55, 58, 60], "xpu_force_sync": 33, "xpu_lib_path": 40, "xpuautoshard": [4, 33, 44], "xx": [34, 61], "xxx": [7, 52, 56], "xxxx": [58, 61], "xxxxx": [34, 51, 62], "xxxxxx": 11, "xxxxxxxx": 52, "xzf": 7, "xzvf": 32, "y": [11, 25, 26, 28, 35, 37, 39, 40, 47, 58, 63], "y_test": [19, 28, 35], "y_train": [19, 28, 35], "yaml": 61, "ye": [19, 38], "you": [2, 3, 4, 5, 7, 8, 11, 13, 14, 16, 17, 18, 20, 21, 22, 23, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 60, 61, 62], "your": [2, 3, 5, 7, 14, 27, 30, 32, 34, 35, 37, 38, 39, 40, 41, 42, 46, 47, 49, 51, 52, 54, 56, 62, 63], "your_script": 29, "your_script_arg": 29, "yourself": 29, "yuxin": 25, "yyi": 52, "yym": 58, "yyyi": 58, "z": [40, 58], "ze_api": 14, "ze_enable_tracing_lay": [4, 21, 22, 28], "zero": [14, 25, 26, 28, 37], "zip": 28, "zoo": 44, "zxvf": 49, "zzz": 7, "zzzz": 58}, "titles": ["Contributor Covenant Code of Conduct", "Security Policy", "Intel\u00ae Extension for TensorFlow* Docker Container Guide", "Intel\u00ae Extension for TensorFlow* Serving - Docker Container Guide", "Welcome to Intel\u00ae Extension for TensorFlow* documentation", "Online Documentation Build Guide", "Welcome to Intel \u00ae Extension for TensorFlow* documentation!", "Contributing guidelines", "Releases", "Directory Tree Structure", "Extension Design", "How to write custom op", "Optimizations Design", "oneDNN object cache optimization", "Frequently Asked Questions", "INT8 Quantization", "OpenXLA", "XPUAutoShard on GPU [Experimental]", "Tune Advanced Auto Mixed Precision", "Advanced Auto Mixed Precision", "Environment Variables", "Features", "GPU Profiler", "Infrastructure", "Graph fusion", "Customized Operators", "Operators Override", "Keras 3 Overview", "Keras Mixed Precision", "Launch Script User Guide", "NextPluggableDevice Overview", "Performance Data", "Practice Guide", "Python APIs", "Install TensorFlow Serving with Intel\u00ae Extension for TensorFlow*", "Selecting Thread Pool in Intel\u00ae Extension for TensorFlow* CPU [Experimental]", "Online Weight Prepack", "Experimental: Intel\u00ae Arc\u2122 A-Series GPU Software Installation", "Conda Environment Installation Instructions", "Overview", "Intel\u00ae Extension for TensorFlow* for C++", "Intel CPU Software Installation", "Intel XPU Software Installation", "Installation Guide", "Examples", "Accelerate AlexNet by Quantization with Intel\u00ae Extension for Tensorflow*", "Common Guide for Running", "Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal", "ResNet50 Inference on Intel CPU and GPU", "Intel\u00ae Extension for Tensorflow* Model Quantization API Example", "Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU", "Accelerate BERT-Large Pretraining on Intel GPU", "Quantize Inception V3 by Intel\u00ae Extension for Tensorflow* on Intel\u00ae Xeon\u00ae", "Quick Example on Intel CPU and GPU", "Stable Diffusion Inference for Text2Image on Intel GPU", "Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU", "BERT Training for Classifying Text on Intel CPU and GPU", "FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU", "Distributed Training Example with Intel\u00ae Optimization for Horovod* on Intel\u00ae GPU", "Refer to train_resnet50", "Accelerate Mask R-CNN Training on Intel GPU", "Resnet50 train on Intel GPU", "Accelerate ResNet50 Training by XPUAutoShard on Intel GPU", "Intel\u00ae Extension for TensorFlow*", "Welcome to Intel \u00ae Extension for TensorFlow* documentation!"], "titleterms": {"1": [0, 11, 31, 34, 37, 40], "1550": 31, "17": 39, "170": 31, "1x": 31, "2": [0, 11, 34, 37, 40], "3": [0, 11, 27, 37], "3d": [31, 55], "4": [0, 11, 31, 37], "4x": 31, "5": 31, "6": 11, "7": 11, "8": 11, "9": 11, "A": 37, "By": 37, "For": [39, 40], "If": 61, "That": 2, "With": 62, "acceler": [45, 50, 51, 55, 60, 62], "access": [2, 32], "accuraci": [31, 54, 57], "activ": 26, "adamw": 26, "adamwithweightdecayoptim": 25, "add": 11, "addit": [31, 39], "advanc": [18, 19, 21, 23, 29, 47, 52], "ai": 31, "alexnet": 45, "all": 29, "alloc": [29, 32], "amp": [19, 21, 47], "api": [17, 18, 20, 21, 23, 33, 47, 48, 49, 54, 62], "appli": [49, 58, 61], "arc": 37, "architectur": [23, 30], "ask": 14, "attribut": [0, 18], "auto": [18, 19, 20, 21], "automat": 47, "automixedprecisionopt": 33, "b0": 31, "b3": 31, "backend": 20, "background": [18, 45, 52], "ban": 0, "bare": [41, 42, 47, 50], "base": [39, 40, 42, 45, 46], "basic": [24, 29], "bazel": [7, 39, 40], "bert": [31, 51, 56, 57], "bf16": 57, "binari": [2, 3, 63], "boost": 52, "build": [2, 3, 5, 11, 14, 28, 34, 39, 40, 41, 42], "c": [7, 34, 40], "cach": 13, "case": 27, "cc": 40, "center": 31, "chang": [8, 51, 54, 55, 57, 60, 61], "channel": 63, "check": [30, 42, 52, 58], "clang": 39, "classifi": [56, 57], "clone": [47, 58], "cnn": 60, "code": [0, 7, 17, 19, 39, 40, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "command": [51, 58, 61, 62], "common": [29, 39, 40, 46], "compar": 47, "compat": 63, "compil": 39, "compressor": 49, "conda": [38, 39, 40], "conduct": 0, "config": [20, 33], "configproto": 33, "configur": [18, 20, 31, 32, 39, 40, 47, 52], "constant": 52, "contain": [2, 3, 41, 42, 47, 50], "content": 32, "contribut": [7, 63], "contributor": 0, "control": 29, "converg": 51, "convolut": 13, "core": 29, "correct": 0, "count": 58, "coven": 0, "cpu": [21, 32, 35, 39, 40, 41, 42, 47, 48, 52, 53, 54, 56, 61, 63], "creat": [5, 39, 40, 58], "current": 30, "custom": [2, 11, 19, 23, 25, 28], "data": [19, 24, 31], "dataset": [49, 51, 55, 60, 61], "debug": 7, "debugopt": 33, "deep": [50, 52], "default": 29, "defin": 11, "definit": 20, "dens": 26, "depend": 58, "deprec": 42, "descript": [2, 3], "design": [10, 12, 29], "detail": 24, "devcloud": [45, 52], "develop": 7, "devic": [30, 58], "differ": [18, 27, 28], "diffus": [31, 54], "directli": 37, "directori": 9, "disabl": 52, "distribut": 58, "docker": [2, 3, 34, 41, 42, 47, 50], "dockerfil": [34, 41, 42], "dockerhub": [41, 42], "document": [4, 5, 6, 7, 63, 64], "download": [39, 40, 47, 56, 58], "driver": [37, 39, 40, 42, 46], "dtype": 28, "dump": 17, "eas": 21, "effect": 36, "efficientnet": 31, "eigen": 35, "enabl": [19, 46, 47, 48, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "end": 18, "enforc": 0, "engin": 23, "environ": [18, 20, 29, 33, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "error": 27, "exampl": [16, 17, 18, 19, 22, 29, 35, 39, 40, 44, 48, 49, 51, 53, 54, 55, 57, 58, 60, 61, 62], "execut": [29, 45, 47, 48, 51, 54, 55, 56, 57, 58, 60, 61, 62], "experiment": [17, 21, 35, 37], "extens": [2, 3, 4, 6, 7, 10, 23, 33, 34, 35, 37, 39, 40, 41, 42, 45, 49, 52, 63, 64], "extra": [39, 40], "extract": 40, "faq": [22, 47, 48, 51, 54, 55, 56, 57, 60], "featur": [19, 21, 23], "file": 40, "fine": 57, "finetun": 51, "fit": 28, "flex": 31, "fold": 52, "format": 32, "fp16": 54, "fp32": [47, 54], "fp8": 57, "frequent": 14, "from": [2, 14, 34, 40, 41, 42], "full": 37, "function": 52, "further": 62, "fusion": 24, "gelu": [25, 26], "gener": 24, "get": [41, 42], "get_config": 33, "gnu": 32, "gpu": [2, 17, 21, 22, 31, 32, 37, 39, 40, 42, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62], "gpuoption": 33, "graph": [17, 19, 21, 24, 33, 52], "graphopt": 33, "groupnorm": 25, "guid": [2, 3, 5, 7, 29, 32, 43, 46, 50], "guidelin": [0, 7], "hardwar": [28, 31, 32, 37, 39, 40, 41, 42, 45, 47, 51, 52, 54, 55, 56, 57, 60, 61, 62, 63], "header": 40, "highlight": 4, "horovod": [55, 58, 61], "how": [11, 16, 28], "hvd": 61, "i": [2, 3, 29], "identifi": 28, "ii": [2, 3, 29], "iii": [2, 29], "imag": [3, 31, 34, 55], "imagenet": 61, "implement": [11, 24], "import": 33, "improv": 18, "incept": [47, 52], "includ": 29, "incompat": 8, "index": 29, "infer": [29, 31, 47, 48, 50, 54], "infrastructur": 23, "instal": [11, 34, 37, 38, 39, 40, 41, 42, 43, 49, 53, 58, 62, 63], "instanc": [26, 29], "instruct": [37, 38], "int8": [15, 21], "integr": 40, "intel": [2, 3, 4, 6, 7, 23, 31, 32, 33, 34, 35, 37, 39, 40, 41, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64], "intel_extension_for_tensorflow": 33, "interfac": 11, "introduct": [5, 13, 23, 45, 47, 50, 51, 52, 54, 55, 56, 57, 60, 61, 62], "issu": 8, "itex": [25, 33], "itex_verbos": 20, "itexlstm": 25, "iv": 29, "ix": 29, "jemalloc": 29, "jupyt": [52, 54, 56], "kera": [27, 28], "kernel": 11, "known": 8, "lamboptim": 25, "larg": [31, 51, 57], "latenc": 29, "latest": 5, "launch": 29, "launcher": 21, "layer": 26, "layernorm": 25, "layout": [24, 32], "lead": 27, "learn": [50, 52], "level": 20, "librari": [34, 40], "licens": [52, 63], "limit": 36, "linker": 40, "linux": 37, "list": 18, "load": 40, "local": [5, 45, 52], "log": [19, 29], "logic": 29, "loop": 28, "loss": 28, "lstm": 26, "manag": 23, "manual": 19, "mask": [31, 60], "matrix": 52, "max": 31, "medic": [31, 55], "memori": [29, 32], "metal": [41, 42, 47, 50], "method": 47, "mix": [18, 19, 20, 21, 24, 28, 47], "mobilenet": 18, "mode": 29, "model": [28, 31, 34, 47, 49, 50, 51, 54, 55, 57, 60, 61], "multi": [29, 55], "multipl": 29, "name": 33, "nativ": 37, "net": 31, "neural": 49, "nextpluggabledevic": 30, "node": [29, 31], "non": 32, "normal": 26, "note": 53, "notebook": [52, 54, 56], "notic": 19, "numa": [29, 32], "numactl": 32, "number": 29, "numer": 18, "o": 55, "object": [13, 16], "omp_num_thread": 32, "one": 29, "oneapi": [37, 39, 40, 42, 46, 58], "onednn": [13, 52], "onli": [39, 40, 42], "onlin": [5, 36], "op": [11, 25, 33], "openmp": [32, 35], "openxla": [16, 21, 30], "oper": [19, 21, 25, 26, 33], "optim": [12, 13, 19, 21, 24, 58], "option": [20, 37, 39, 40, 58], "origin": 19, "other": 62, "our": 0, "output": [48, 53, 54, 58, 61, 62], "overflow": 28, "overrid": [26, 33], "overview": [15, 16, 17, 19, 20, 27, 28, 29, 30, 31, 32, 33, 36, 39, 49], "packag": [11, 40, 42, 62], "paramet": [61, 62], "patch": [58, 61], "perform": [18, 27, 31, 47], "perman": 0, "phase2": 31, "physic": 29, "pjrt": 30, "platform": 42, "pledg": 0, "pluggabledevic": 30, "plugin": 30, "polici": [1, 28], "pool": 35, "practic": 32, "pre": 49, "precis": [18, 19, 20, 21, 28, 47], "precondit": 38, "prepack": 36, "prepar": [2, 3, 40, 44, 46, 47, 48, 49, 51, 54, 55, 56, 57, 58, 60, 61, 62], "prerequisit": [11, 33, 48, 51, 54, 55, 56, 57, 60, 61, 62], "preserv": 33, "pretrain": [47, 51], "product": 31, "profil": [21, 22], "protocol": [20, 33], "public": 23, "py": 53, "pypi": [37, 39, 41, 42], "python": [7, 11, 17, 18, 20, 21, 33, 40, 47, 48, 54, 62], "pythonpath": 62, "quantiz": [15, 21, 45, 49, 52], "question": 14, "quick": [19, 50, 53], "quick_exampl": 53, "r": 60, "rcnn": 31, "recommend": 40, "refer": [16, 36, 59], "regist": 11, "releas": [5, 8, 37], "repo": 58, "report": 1, "repositori": 47, "requir": [37, 39, 40, 41, 42, 47, 51, 54, 55, 56, 57, 60, 61, 62, 63], "resnet50": [48, 61, 62], "resnet50v1": 31, "resourc": [10, 63], "respons": 0, "result": [31, 47, 51], "rule": 18, "run": [2, 3, 34, 37, 40, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "runtim": [14, 30], "sampl": 34, "save": 19, "scale": 28, "scope": 0, "script": [2, 29, 46], "secur": [1, 63], "segment": 55, "select": 35, "seri": 37, "serv": [3, 21, 34], "server": [34, 45, 52], "set": [28, 29, 45, 49, 61, 62], "set_config": 33, "setup": [19, 28, 37, 42, 46, 47, 48, 51, 54, 55, 56, 57, 58, 60, 61, 62], "shard": 62, "shardingconfig": 33, "singl": [29, 55], "situat": 27, "skip": [47, 48, 54, 56, 61], "softwar": [31, 32, 37, 41, 42, 49, 63], "sourc": [14, 34, 39, 40], "speed": 47, "stabil": 18, "stabl": [31, 54], "standard": 0, "start": [30, 50], "startup": [52, 56], "step": [37, 38, 47, 48, 54, 56, 61], "stock": [18, 19], "structur": [9, 17], "style": 7, "subsystem": 37, "support": [21, 63], "switch": 30, "system": [37, 41, 42], "tabl": [32, 63], "tcmalloc": [29, 32], "temporari": 0, "tensorflow": [2, 3, 4, 6, 7, 18, 19, 21, 23, 33, 34, 35, 37, 39, 40, 41, 42, 45, 49, 52, 63, 64], "test": [5, 7, 47], "text": [56, 57], "text2imag": 54, "tf_num_interop_thread": 29, "tf_num_intraop_thread": 29, "thi": [47, 48, 54, 56, 61], "thread": 35, "throughput": 29, "tile": 55, "tip": [7, 19], "toolkit": [39, 40, 42, 46], "train": [19, 28, 31, 49, 50, 55, 56, 58, 60, 61, 62], "train_resnet50": 59, "tree": 9, "troubleshoot": 14, "tune": [18, 19, 57], "type": [19, 24, 28, 30], "u": 31, "ubuntu": 37, "underflow": 28, "unet": 55, "uniform": 32, "unit": 7, "up": [45, 47, 49], "updat": 5, "us": [11, 21, 27, 29, 30, 34, 35, 61], "usag": [2, 15, 17, 18, 19, 22, 26, 29, 36], "user": 29, "v": [19, 29], "v1": 31, "v3": 52, "v4": 47, "variabl": [18, 20, 29, 33, 37, 42, 47], "vasriabl": 54, "verifi": [2, 11, 37, 41, 42], "version": [5, 33, 52], "vi": 29, "via": [20, 37, 41, 42, 47], "vii": 29, "viii": 29, "virtual": [37, 41, 42, 46, 58], "vulner": 1, "w": 55, "warn": [0, 27], "weekli": 63, "weight": 36, "welcom": [4, 6, 64], "wheel": [37, 41, 42], "why": 30, "window": 37, "without": [61, 62], "work": 16, "workflow": [10, 15, 17, 36], "workload": [31, 50], "write": 11, "wsl2": 37, "x": 29, "xeon": 52, "xla": 30, "xpu": [23, 39, 40, 42, 63], "xpuautoshard": [17, 21, 62], "your": 29, "zoo": 50}}) \ No newline at end of file +Search.setIndex({"alltitles": {"1. Prerequisite": [[11, "prerequisite"]], "1. Build Intel\u00ae Extension for TensorFlow* C++ library": [[34, "build-intel-extension-for-tensorflow-c-library"]], "1. Correction": [[0, "correction"]], "1. Install GPU Drivers": [[37, "install-gpu-drivers"]], "2. Define the op interface and Register op": [[11, "define-the-op-interface-and-register-op"]], "2. Build TensorFlow Serving": [[34, "build-tensorflow-serving"]], "2. Install TensorFlow* via PyPI Wheel in Linux": [[37, "install-tensorflow-via-pypi-wheel-in-linux"]], "2. Warning": [[0, "warning"]], "3. Register the kernels for the op": [[11, "register-the-kernels-for-the-op"]], "3. Install Intel\u00ae Extension for TensorFlow*": [[37, "install-intel-extension-for-tensorflow"]], "3. Temporary Ban": [[0, "temporary-ban"]], "4. Implement the kernels": [[11, "implement-the-kernels"]], "4. Permanent Ban": [[0, "permanent-ban"]], "4. Verify the Installation": [[37, "verify-the-installation"]], "6. Add the op to BUILD": [[11, "add-the-op-to-build"]], "7. Use the op in Python": [[11, "use-the-op-in-python"]], "8. Build the package": [[11, "build-the-package"]], "9. Install and Verify": [[11, "install-and-verify"]], "Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU": [[55, "accelerate-3d-unet-training-w-o-horovod-for-medical-image-segmentation-on-intel-gpu"]], "Accelerate AlexNet by Quantization with Intel\u00ae Extension for Tensorflow*": [[45, "accelerate-alexnet-by-quantization-with-intel-extension-for-tensorflow"]], "Accelerate BERT-Large Pretraining on Intel GPU": [[51, "accelerate-bert-large-pretraining-on-intel-gpu"]], "Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU": [[50, "accelerate-deep-learning-training-and-inference-for-model-zoo-workloads-on-intel-gpu"]], "Accelerate Mask R-CNN Training on Intel GPU": [[60, "accelerate-mask-r-cnn-training-on-intel-gpu"]], "Accelerate ResNet50 Training by XPUAutoShard on Intel GPU": [[62, "accelerate-resnet50-training-by-xpuautoshard-on-intel-gpu"]], "Accuracy": [[54, "accuracy"], [57, "accuracy"]], "AdamW": [[26, "adamw"]], "Additional": [[39, "additional"]], "Additional Performance Data for Intel AI Data Center Products": [[31, "additional-performance-data-for-intel-ai-data-center-products"]], "Advanced AMP vs. Stock TensorFlow AMP": [[19, "advanced-amp-vs-stock-tensorflow-amp"]], "Advanced Auto Mixed Precision": [[19, "advanced-auto-mixed-precision"], [19, "id1"]], "Advanced Auto Mixed Precision (AMP)": [[21, "advanced-auto-mixed-precision-amp"]], "Advanced Settings": [[29, "advanced-settings"]], "Advanced: Enable Advanced AMP Method": [[47, "advanced-enable-advanced-amp-method"]], "Apply Model Quantization": [[49, "apply-model-quantization"]], "Apply Patch": [[61, "apply-patch"]], "Apply Patch for Intel GPU": [[58, "apply-patch-for-intel-gpu"]], "Architecture": [[23, "architecture"]], "Attribution": [[0, "attribution"]], "Auto Mixed Precision Options": [[20, "auto-mixed-precision-options"]], "BERT Training for Classifying Text on Intel CPU and GPU": [[56, "bert-training-for-classifying-text-on-intel-cpu-and-gpu"]], "BERT-Large Phase2 Training Performance Results": [[31, "bert-large-phase2-training-performance-results"]], "BF16 + FP8 Fine-tuning": [[57, "bf16-fp8-fine-tuning"]], "Backend and Config Protocol": [[20, "backend-and-config-protocol"]], "Background": [[18, "background"], [45, "background"], [52, "background"]], "Basic Settings": [[29, "basic-settings"]], "Basic fusion": [[24, "basic-fusion"]], "Binaries Preparation": [[2, "binaries-preparation"]], "Build Docker container from Dockerfile": [[41, "build-docker-container-from-dockerfile"], [42, "build-docker-container-from-dockerfile"]], "Build Docker image from Dockerfile": [[34, "build-docker-image-from-dockerfile"]], "Build Intel\u00ae Extension for TensorFlow* CC library": [[40, "build-intel-extension-for-tensorflow-cc-library"]], "Build Intel\u00ae Extension for TensorFlow* PyPI": [[39, "build-intel-extension-for-tensorflow-pypi"]], "Build Source Code": [[39, "build-source-code"], [40, "build-source-code"]], "Build and run": [[40, "build-and-run"]], "Build from source": [[14, "build-from-source"], [34, "build-from-source"]], "Build the Docker Image": [[3, "build-the-docker-image"]], "Build to Local Test": [[5, "build-to-local-test"]], "Building the model": [[28, "building-the-model"]], "C++ coding style": [[7, "c-coding-style"]], "CPU": [[52, "cpu"]], "CPU Launcher [Experimental]": [[21, "cpu-launcher-experimental"]], "CPU Practice Guide": [[32, "cpu-practice-guide"]], "Check Currently Used Device Type": [[30, "check-currently-used-device-type"]], "Check Device Count (Optional)": [[58, "check-device-count-optional"]], "Check Intel\u00ae Advanced Matrix Extensions": [[52, "check-intel-advanced-matrix-extensions"]], "Check Intel\u00ae Deep Learning Boost": [[52, "check-intel-deep-learning-boost"]], "Check the Environment for XPU": [[42, "check-the-environment-for-xpu"]], "Clone Horovod Repo": [[58, "clone-horovod-repo"]], "Clone the Repository": [[47, "clone-the-repository"]], "Code": [[53, "code"]], "Code Structure": [[17, "code-structure"]], "Code style guide": [[7, "code-style-guide"]], "Command": [[61, "command"]], "Command with Horovod": [[61, "command-with-horovod"]], "Commands": [[51, "commands"]], "Common Execution Mode": [[29, "common-execution-mode"]], "Common Guide for Running": [[46, "common-guide-for-running"]], "Common Requirements": [[39, "common-requirements"], [40, "common-requirements"]], "Compatibility Table": [[63, "compatibility-table"]], "Conda Environment Installation Instructions": [[38, "conda-environment-installation-instructions"]], "Configuration": [[31, "configuration"], [52, "configuration"]], "Configuration List": [[18, "configuration-list"]], "Configuration via Environment Variables": [[20, "configuration-via-environment-variables"]], "Configure": [[39, "configure"], [40, "configure"]], "Configure Example For XPU": [[39, "configure-example-for-xpu"]], "Configure Example for CPU": [[39, "configure-example-for-cpu"]], "Configure For CPU": [[39, "configure-for-cpu"], [40, "configure-for-cpu"]], "Configure For GPU": [[40, "configure-for-gpu"]], "Configure For XPU": [[39, "configure-for-xpu"]], "Contributing": [[63, "contributing"]], "Contributing guidelines": [[7, "contributing-guidelines"]], "Contributing to Intel\u00ae Extension for TensorFlow*": [[7, "contributing-to-intel-extension-for-tensorflow"]], "Contributor Covenant Code of Conduct": [[0, "contributor-covenant-code-of-conduct"]], "Convergence": [[51, "convergence"]], "Create Release Version": [[5, "create-release-version"]], "Create Virtual Environment": [[58, "create-virtual-environment"]], "Create a Conda Environment": [[39, "create-a-conda-environment"], [40, "create-a-conda-environment"]], "Custom API": [[23, "custom-api"]], "Custom Operation": [[19, "custom-operation"]], "Customized Operators": [[25, "customized-operators"]], "Data Type": [[19, "data-type"]], "Default memory allocator": [[29, "default-memory-allocator"]], "Dense Layer": [[26, "dense-layer"]], "Dependency": [[58, "dependency"]], "Description": [[2, "description"], [3, "description"]], "Developing Intel\u00ae Extension for TensorFlow*": [[7, "developing-intel-extension-for-tensorflow"]], "Directory Tree Structure": [[9, "directory-tree-structure"]], "Disable Constant Folding Function": [[52, "disable-constant-folding-function"]], "Distributed Training Example with Intel\u00ae Optimization for Horovod* on Intel\u00ae GPU": [[58, "distributed-training-example-with-intel-optimization-for-horovod-on-intel-gpu"]], "Documentation": [[4, "documentation"], [63, "documentation"]], "Documentation style guide": [[7, "documentation-style-guide"]], "Download Jupyter Code:": [[56, "download-jupyter-code"]], "Download Patch": [[58, "download-patch"]], "Download Source Code": [[39, "download-source-code"], [40, "download-source-code"]], "Download the Pretrained-model": [[47, "download-the-pretrained-model"]], "Dump the graph": [[17, "dump-the-graph"]], "Ease-of-use Python API": [[21, "ease-of-use-python-api"]], "EfficientNet-B0 Inference Performance Results": [[31, "efficientnet-b0-inference-performance-results"]], "EfficientNet-B3 Inference Performance Results": [[31, "efficientnet-b3-inference-performance-results"]], "Enable Advanced AMP": [[19, "enable-advanced-amp"]], "Enable Running Environment": [[47, "enable-running-environment"], [48, "enable-running-environment"], [51, "enable-running-environment"], [54, "enable-running-environment"], [55, "enable-running-environment"], [56, "enable-running-environment"], [57, "enable-running-environment"], [60, "enable-running-environment"], [61, "enable-running-environment"], [62, "enable-running-environment"]], "Enable Virtual Running Environment": [[46, "enable-virtual-running-environment"]], "Enable oneAPI": [[58, "enable-oneapi"]], "Enable oneAPI Running Environment": [[46, "enable-oneapi-running-environment"]], "Enable oneDNN Graph": [[52, "enable-onednn-graph"]], "End-to-end Example": [[18, "end-to-end-example"]], "Enforcement": [[0, "enforcement"]], "Enforcement Guidelines": [[0, "enforcement-guidelines"]], "Enforcement Responsibilities": [[0, "enforcement-responsibilities"]], "Environment Variable Configuration": [[47, "environment-variable-configuration"]], "Environment Variable Difference with Stock TensorFlow": [[18, "environment-variable-difference-with-stock-tensorflow"]], "Environment Variables": [[20, "environment-variables"], [29, "environment-variables"]], "Environment Variables with Python APIs": [[20, "environment-variables-with-python-apis"]], "Environment Vasriable": [[54, "environment-vasriable"]], "Example": [[16, "example"], [18, "example"], [19, "example"], [35, "example"], [40, "example"]], "Example Output": [[48, "example-output"], [53, "example-output"], [54, "example-output"], [62, "example-output"]], "Example Output with hvd": [[61, "example-output-with-hvd"]], "Example Output without hvd": [[61, "example-output-without-hvd"]], "Example of Mix Precision by List": [[18, "example-of-mix-precision-by-list"]], "Example:": [[22, "example"]], "Examples": [[17, "examples"], [29, "examples"], [44, "examples"], [44, "id1"]], "Execute": [[45, "execute"], [56, "execute"]], "Execute Testing and Comparing the Performance of FP32 and Advanced AMP on CPU and GPU in Docker Container or Bare Metal": [[47, "execute-testing-and-comparing-the-performance-of-fp32-and-advanced-amp-on-cpu-and-gpu-in-docker-container-or-bare-metal"]], "Execute the Example": [[51, "execute-the-example"], [55, "execute-the-example"], [57, "execute-the-example"], [60, "execute-the-example"]], "Executes the Example with Python API": [[48, "executes-the-example-with-python-api"], [54, "executes-the-example-with-python-api"], [62, "executes-the-example-with-python-api"]], "Executing Command": [[62, "executing-command"]], "Execution": [[58, "execution"], [61, "execution"]], "Experimental Release": [[37, "experimental-release"]], "Experimental: Intel\u00ae Arc\u2122 A-Series GPU Software Installation": [[37, "experimental-intel-arc-a-series-gpu-software-installation"]], "Extension Design": [[10, "extension-design"]], "Extra Requirements for XPU Build Only": [[39, "extra-requirements-for-xpu-build-only"]], "Extra Requirements for XPU/GPU Build Only": [[40, "extra-requirements-for-xpu-gpu-build-only"]], "FAQ": [[22, "faq"], [47, "faq"], [48, "faq"], [51, "faq"], [54, "faq"], [55, "faq"], [56, "faq"], [57, "faq"], [60, "faq"]], "FP16 Inference": [[54, "fp16-inference"]], "FP32 Inference": [[54, "fp32-inference"]], "FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU": [[57, "fp8-bert-large-fine-tuning-for-classifying-text-on-intel-gpu"]], "Feature": [[19, "feature"]], "Features": [[21, "features"]], "Finetune Command": [[51, "finetune-command"]], "Frequently Asked Questions": [[14, "frequently-asked-questions"]], "Further Settings": [[62, "further-settings"]], "GNU OpenMP": [[32, "gnu-openmp"]], "GPU": [[45, "gpu"], [52, "gpu"]], "GPU Practice Guide": [[32, "gpu-practice-guide"]], "GPU Profiler": [[21, "gpu-profiler"], [22, "gpu-profiler"]], "Gelu Activation": [[26, "gelu-activation"]], "Generic layout optimizer": [[24, "generic-layout-optimizer"]], "Get docker container from dockerhub": [[41, "get-docker-container-from-dockerhub"], [42, "get-docker-container-from-dockerhub"]], "Graph Optimization": [[21, "graph-optimization"]], "Graph Optimizer": [[19, "graph-optimizer"]], "Graph fusion": [[24, "graph-fusion"]], "Hardware Configuration": [[31, "hardware-configuration"], [32, "hardware-configuration"]], "Hardware Configuration for Intel Flex 170 GPU": [[31, "hardware-configuration-for-intel-flex-170-gpu"]], "Hardware Configuration for Intel Max 1550 GPU": [[31, "hardware-configuration-for-intel-max-1550-gpu"]], "Hardware Environment": [[45, "hardware-environment"], [52, "hardware-environment"]], "Hardware Requirement": [[47, "hardware-requirement"], [63, "hardware-requirement"]], "Hardware Requirements": [[37, "hardware-requirements"], [39, "hardware-requirements"], [40, "hardware-requirements"], [41, "hardware-requirements"], [42, "hardware-requirements"], [51, "hardware-requirements"], [54, "hardware-requirements"], [55, "hardware-requirements"], [56, "hardware-requirements"], [57, "hardware-requirements"], [60, "hardware-requirements"], [61, "hardware-requirements"], [62, "hardware-requirements"]], "Highlights": [[4, "highlights"]], "How it works": [[16, "how-it-works"]], "How to identify different hardware types?": [[28, "how-to-identify-different-hardware-types"]], "How to write custom op": [[11, "how-to-write-custom-op"]], "I. Binaries Preparation": [[3, "i-binaries-preparation"]], "I. Customize Build Script": [[2, "i-customize-build-script"]], "I. Use all physical cores": [[29, "i-use-all-physical-cores"]], "II. Build the Container": [[2, "ii-build-the-container"], [3, "ii-build-the-container"]], "II. Use all cores including logical cores": [[29, "ii-use-all-cores-including-logical-cores"]], "III. Running the Container": [[2, "iii-running-the-container"]], "III. Use physical cores on one node": [[29, "iii-use-physical-cores-on-one-node"]], "INT8 Quantization": [[15, "int8-quantization"], [21, "int8-quantization"]], "ITEX_VERBOSE level definition": [[20, "itex-verbose-level-definition"]], "IV. Use your designated number of cores": [[29, "iv-use-your-designated-number-of-cores"]], "IX. Set environment variable TF_NUM_INTRAOP_THREADS": [[29, "ix-set-environment-variable-tf-num-intraop-threads"]], "If not use Horovod": [[61, "if-not-use-horovod"]], "If use Horovod": [[61, "if-use-horovod"]], "Implementation Details": [[24, "implementation-details"]], "Incompatible Changes": [[8, "incompatible-changes"]], "Inference Performance Results": [[31, "inference-performance-results"]], "Inference Performance on 1x Intel Data Center GPU Flex 170": [[31, "inference-performance-on-1x-intel-data-center-gpu-flex-170"]], "Inference Workloads": [[31, "inference-workloads"]], "Infrastructure": [[23, "infrastructure"]], "Install": [[58, "install"], [63, "install"]], "Install Bazel": [[39, "install-bazel"], [40, "install-bazel"]], "Install Clang-17 compiler": [[39, "install-clang-17-compiler"]], "Install GPU Drivers": [[42, "install-gpu-drivers"]], "Install Intel GPU Driver": [[39, "install-intel-gpu-driver"], [40, "install-intel-gpu-driver"]], "Install Intel\u00ae Extension for TensorFlow*": [[41, "install-intel-extension-for-tensorflow"], [42, "install-intel-extension-for-tensorflow"]], "Install Intel\u00ae Extension for Tensorflow*": [[49, "install-intel-extension-for-tensorflow"]], "Install Intel\u00ae Neural Compressor": [[49, "install-intel-neural-compressor"]], "Install Model Server": [[34, "install-model-server"]], "Install Other Required Packages": [[62, "install-other-required-packages"]], "Install TensorFlow": [[37, "install-tensorflow"], [39, "install-tensorflow"], [40, "install-tensorflow"], [41, "install-tensorflow"], [42, "install-tensorflow"]], "Install TensorFlow Serving with Intel\u00ae Extension for TensorFlow*": [[34, "install-tensorflow-serving-with-intel-extension-for-tensorflow"]], "Install for CPU": [[63, "install-for-cpu"]], "Install for CPU weekly": [[63, "install-for-cpu-weekly"]], "Install for XPU": [[63, "install-for-xpu"]], "Install for XPU weekly": [[63, "install-for-xpu-weekly"]], "Install for weekly binaries": [[63, "install-for-weekly-binaries"]], "Install oneAPI Base Toolkit": [[39, "install-oneapi-base-toolkit"], [40, "install-oneapi-base-toolkit"]], "Install oneAPI Base Toolkit Packages": [[42, "install-oneapi-base-toolkit-packages"]], "Install using Docker": [[34, "install-using-docker"]], "Install via Docker container": [[41, "install-via-docker-container"], [42, "install-via-docker-container"]], "Install via PyPI wheel in bare metal": [[41, "install-via-pypi-wheel-in-bare-metal"], [42, "install-via-pypi-wheel-in-bare-metal"]], "Installation": [[53, "installation"]], "Installation Channel:": [[63, "installation-channel"]], "Installation Guide": [[43, "installation-guide"]], "Instance Normalization": [[26, "instance-normalization"]], "Integrate the CC library": [[40, "integrate-the-cc-library"]], "Intel Advanced Feature and Extension Management": [[23, "intel-advanced-feature-and-extension-management"]], "Intel CPU Software Installation": [[41, "intel-cpu-software-installation"]], "Intel GPU Driver": [[46, "intel-gpu-driver"]], "Intel OpenMP": [[32, "intel-openmp"]], "Intel XPU Software Installation": [[42, "intel-xpu-software-installation"]], "Intel\u00ae DevCloud": [[45, "intel-devcloud"], [52, "intel-devcloud"]], "Intel\u00ae Extension for TensorFlow*": [[63, "intel-extension-for-tensorflow"]], "Intel\u00ae Extension for TensorFlow* Config Protocol": [[33, "intel-extension-for-tensorflow-config-protocol"]], "Intel\u00ae Extension for TensorFlow* Docker Container Guide": [[2, "intel-extension-for-tensorflow-docker-container-guide"]], "Intel\u00ae Extension for TensorFlow* Serving - Docker Container Guide": [[3, "intel-extension-for-tensorflow-serving-docker-container-guide"]], "Intel\u00ae Extension for TensorFlow* for C++": [[40, "intel-extension-for-tensorflow-for-c"]], "Intel\u00ae Extension for Tensorflow* Model Quantization API Example": [[49, "intel-extension-for-tensorflow-model-quantization-api-example"]], "Intel\u00ae Extension for Tensorflow* Version": [[52, "intel-extension-for-tensorflow-version"]], "Intel\u00ae oneAPI Base Toolkit": [[46, "intel-oneapi-base-toolkit"]], "Introduction": [[5, "introduction"], [13, "introduction"], [23, "introduction"], [45, "introduction"], [47, "introduction"], [50, "introduction"], [51, "introduction"], [52, "introduction"], [54, "introduction"], [55, "introduction"], [56, "introduction"], [57, "introduction"], [60, "introduction"], [61, "introduction"], [62, "introduction"]], "Jemalloc": [[29, "jemalloc"]], "Keras 3 Overview": [[27, "keras-3-overview"]], "Keras Mixed Precision": [[28, "keras-mixed-precision"]], "Known Issues": [[8, "known-issues"]], "LSTM": [[26, "lstm"]], "Latency mode": [[29, "latency-mode"]], "Launch Log": [[29, "launch-log"]], "Launch Script User Guide": [[29, "launch-script-user-guide"]], "Layer Normalization": [[26, "layer-normalization"]], "License": [[52, "license"], [63, "license"]], "Limitation": [[36, "limitation"]], "Linker": [[40, "linker"]], "Load": [[40, "load"]], "Local Server": [[45, "local-server"], [52, "local-server"]], "Log and Save Optimized Graph": [[19, "log-and-save-optimized-graph"]], "Loss scaling": [[28, "loss-scaling"]], "Loss scaling overview": [[28, "loss-scaling-overview"]], "Mask-RCNN Inference Performance Results": [[31, "mask-rcnn-inference-performance-results"]], "Mask-RCNN Training Performance Results": [[31, "mask-rcnn-training-performance-results"]], "Medical Image 3D U-Net Training Performance Results": [[31, "medical-image-3d-u-net-training-performance-results"]], "Memory Allocator": [[29, "memory-allocator"], [32, "memory-allocator"]], "Memory Layout format": [[32, "memory-layout-format"]], "Mixed data type fusion": [[24, "mixed-data-type-fusion"]], "Model Code change": [[51, "model-code-change"], [54, "model-code-change"], [55, "model-code-change"], [57, "model-code-change"], [60, "model-code-change"], [61, "model-code-change"]], "Models": [[31, "models"]], "Multi-instance": [[29, "multi-instance"]], "Multi-tile with horovod": [[55, "multi-tile-with-horovod"]], "Multiple instances for inference": [[29, "multiple-instances-for-inference"]], "NUMA Control": [[29, "numa-control"]], "Native Linux Running Directly on Hardware": [[37, "native-linux-running-directly-on-hardware"], [37, "id2"]], "NextPluggableDevice Architecture": [[30, "nextpluggabledevice-architecture"]], "NextPluggableDevice Overview": [[30, "nextpluggabledevice-overview"]], "Non-Uniform Memory Access (NUMA)": [[32, "non-uniform-memory-access-numa"]], "Notes": [[53, "notes"]], "Notice": [[19, "notice"]], "Numactl": [[32, "numactl"]], "Numeric Stability": [[18, "numeric-stability"]], "OMP_NUM_THREADS": [[32, "omp-num-threads"]], "Objectives": [[16, "objectives"]], "Online Documentation Build Guide": [[5, "online-documentation-build-guide"]], "Online Weight Prepack": [[36, "online-weight-prepack"]], "OpenMP": [[32, "openmp"]], "OpenXLA": [[16, "openxla"]], "OpenXLA PJRT Plugin": [[30, "openxla-pjrt-plugin"]], "OpenXLA Support on GPU [Experimental]": [[21, "openxla-support-on-gpu-experimental"]], "Operator Optimization": [[21, "operator-optimization"]], "Operators Override": [[26, "operators-override"]], "Optimization in convolution": [[13, "optimization-in-convolution"]], "Optimizations Design": [[12, "optimizations-design"]], "Option 1: Extract from Tensorflow* python package (Recommended)": [[40, "option-1-extract-from-tensorflow-python-package-recommended"]], "Option 2: Build from TensorFlow* source code": [[40, "option-2-build-from-tensorflow-source-code"]], "Optional Requirements for CPU Build Only": [[39, "optional-requirements-for-cpu-build-only"]], "Optional: Install Full Intel\u00ae oneAPI": [[37, "optional-install-full-intel-oneapi"]], "Original Code": [[19, "original-code"]], "Our Pledge": [[0, "our-pledge"]], "Our Standards": [[0, "our-standards"]], "Output": [[58, "output"]], "Overview": [[15, "overview"], [16, "overview"], [17, "overview"], [19, "overview"], [20, "overview"], [28, "overview"], [29, "overview"], [31, "overview"], [32, "overview"], [33, "overview"], [36, "overview"], [39, "overview"], [49, "overview"]], "Performance Data": [[31, "performance-data"]], "Practice Guide": [[32, "practice-guide"]], "Preconditions": [[38, "preconditions"]], "Prepare": [[46, "prepare"]], "Prepare Dataset": [[49, "prepare-dataset"], [51, "prepare-dataset"], [55, "prepare-dataset"], [60, "prepare-dataset"]], "Prepare Example Code": [[58, "prepare-example-code"]], "Prepare ImageNet dataset": [[61, "prepare-imagenet-dataset"]], "Prepare Pre-Trained Model": [[49, "prepare-pre-trained-model"]], "Prepare Tensorflow* CC library and header files": [[40, "prepare-tensorflow-cc-library-and-header-files"]], "Prepare for GPU": [[51, "prepare-for-gpu"], [55, "prepare-for-gpu"], [57, "prepare-for-gpu"], [60, "prepare-for-gpu"], [62, "prepare-for-gpu"]], "Prepare for GPU (Skip this Step for CPU)": [[47, "prepare-for-gpu-skip-this-step-for-cpu"]], "Prepare for GPU (Skip this step for CPU)": [[48, "prepare-for-gpu-skip-this-step-for-cpu"], [54, "prepare-for-gpu-skip-this-step-for-cpu"], [56, "prepare-for-gpu-skip-this-step-for-cpu"], [61, "prepare-for-gpu-skip-this-step-for-cpu"]], "Prepare for Running": [[44, "prepare-for-running"]], "Prepare the Codes": [[62, "prepare-the-codes"]], "Prerequisite: import intel_extension_for_tensorflow as itex": [[33, "prerequisite-import-intel-extension-for-tensorflow-as-itex"]], "Prerequisites": [[48, "prerequisites"], [51, "prerequisites"], [51, "id1"], [51, "id2"], [54, "prerequisites"], [55, "prerequisites"], [56, "prerequisites"], [57, "prerequisites"], [60, "prerequisites"], [61, "prerequisites"], [62, "prerequisites"]], "Pretraining Command": [[51, "pretraining-command"]], "Python API": [[17, "python-api"], [18, "python-api"], [47, "python-api"], [62, "python-api"]], "Python API Attribute & Environment Variable": [[18, "python-api-attribute-environment-variable"]], "Python APIs": [[33, "python-apis"]], "Python APIs and Environment Variable Names": [[33, "python-apis-and-environment-variable-names"]], "Python APIs and preserved environment variable Names": [[33, "python-apis-and-preserved-environment-variable-names"]], "Python Unit Testing": [[7, "python-unit-testing"]], "Python coding style": [[7, "python-coding-style"]], "Quantize Inception V3 by Intel\u00ae Extension for Tensorflow* on Intel\u00ae Xeon\u00ae": [[52, "quantize-inception-v3-by-intel-extension-for-tensorflow-on-intel-xeon"]], "Quick Example on Intel CPU and GPU": [[53, "quick-example-on-intel-cpu-and-gpu"]], "Quick Start Guide": [[50, "quick-start-guide"]], "Quick Training Example": [[19, "quick-training-example"]], "Refer to train_resnet50": [[59, "refer-to-train-resnet50"]], "Reference": [[36, "reference"]], "References": [[16, "references"]], "Releases": [[8, "releases"]], "Report a Vulnerability": [[1, "report-a-vulnerability"]], "Requirements": [[39, "requirements"], [40, "requirements"]], "ResNet50 Inference on Intel CPU and GPU": [[48, "resnet50-inference-on-intel-cpu-and-gpu"]], "ResNet50v1-5 Inference Performance Results": [[31, "resnet50v1-5-inference-performance-results"]], "ResNet50v1-5 Training Performance Results": [[31, "resnet50v1-5-training-performance-results"]], "Resnet50 train on Intel GPU": [[61, "resnet50-train-on-intel-gpu"]], "Resources": [[10, "resources"], [63, "resources"]], "Result": [[47, "result"]], "Results": [[51, "results"]], "Rule to Improve Performance by the Configuration List": [[18, "rule-to-improve-performance-by-the-configuration-list"]], "Run Model Quantization Example:": [[49, "run-model-quantization-example"]], "Run Models in the Docker Container": [[50, "run-models-in-the-docker-container"]], "Run Models on Bare Metal": [[50, "run-models-on-bare-metal"]], "Run Script": [[46, "run-script"]], "Run sample": [[34, "run-sample"]], "Running": [[46, "running"]], "Running Command": [[58, "running-command"]], "Running Environment": [[45, "running-environment"], [52, "running-environment"]], "Running the Container": [[3, "running-the-container"]], "Running the Jupyter Notebook": [[54, "running-the-jupyter-notebook"]], "Runtime": [[14, "runtime"]], "Runtime Switch of NextPluggableDevice and PluggableDevice": [[30, "runtime-switch-of-nextpluggabledevice-and-pluggabledevice"]], "Scope": [[0, "scope"]], "Security": [[63, "security"]], "Security Policy": [[1, "security-policy"]], "Selecting Thread Pool in Intel\u00ae Extension for TensorFlow* CPU [Experimental]": [[35, "selecting-thread-pool-in-intel-extension-for-tensorflow-cpu-experimental"]], "Set Model Parameters": [[61, "set-model-parameters"]], "Set Up Software Environment": [[49, "set-up-software-environment"]], "Set environment variables for inference": [[29, "set-environment-variables-for-inference"]], "Set up Base Running Environment": [[45, "set-up-base-running-environment"]], "Set up Intel\u00ae Extension for Tensorflow* for GPU": [[45, "set-up-intel-extension-for-tensorflow-for-gpu"]], "Setting the dtype policy": [[28, "setting-the-dtype-policy"]], "Setup": [[19, "setup"], [28, "setup"]], "Setup PYTHONPATH": [[62, "setup-pythonpath"]], "Setup Running Environment": [[46, "setup-running-environment"], [47, "setup-running-environment"], [48, "setup-running-environment"], [51, "setup-running-environment"], [54, "setup-running-environment"], [55, "setup-running-environment"], [56, "setup-running-environment"], [57, "setup-running-environment"], [58, "setup-running-environment"], [60, "setup-running-environment"], [61, "setup-running-environment"]], "Setup environment variables": [[37, "setup-environment-variables"], [42, "setup-environment-variables"]], "Sharding Parameters Setting": [[62, "sharding-parameters-setting"]], "Single Tile": [[55, "single-tile"]], "Single instance for inference": [[29, "single-instance-for-inference"]], "Situations leads to warning or Error": [[27, "situations-leads-to-warning-or-error"]], "Software Configuration": [[31, "software-configuration"], [32, "software-configuration"]], "Software Configuration for Intel Flex 170 GPU": [[31, "software-configuration-for-intel-flex-170-gpu"]], "Software Configuration for Intel Max 1550 GPU": [[31, "software-configuration-for-intel-max-1550-gpu"]], "Software Requirement": [[63, "software-requirement"]], "Software Requirements": [[37, "software-requirements"], [41, "software-requirements"], [42, "software-requirements"]], "Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal": [[47, "speed-up-inference-of-inception-v4-by-advanced-automatic-mixed-precision-on-intel-cpu-and-gpu-via-docker-container-or-bare-metal"]], "Stable Diffusion Inference for Text2Image on Intel GPU": [[54, "stable-diffusion-inference-for-text2image-on-intel-gpu"]], "Stable Diffusion v1-4 Inference Performance Results": [[31, "stable-diffusion-v1-4-inference-performance-results"]], "Start with XLA using NextPluggableDevice": [[30, "start-with-xla-using-nextpluggabledevice"]], "Startup Jupyter Notebook": [[52, "startup-jupyter-notebook"], [56, "startup-jupyter-notebook"]], "Step": [[47, "step"]], "Step by step instructions:": [[38, "step-by-step-instructions"]], "Step-By-Step Instructions": [[37, "step-by-step-instructions"]], "Support": [[63, "support"]], "System environment install": [[37, "system-environment-install"], [41, "system-environment-install"], [42, "system-environment-install"]], "TCMalloc": [[29, "tcmalloc"], [32, "tcmalloc"]], "Table of Contents": [[32, "table-of-contents"]], "TensorFlow Public API": [[23, "tensorflow-public-api"]], "TensorFlow Serving": [[21, "tensorflow-serving"]], "Throughput mode": [[29, "throughput-mode"]], "Tips": [[19, "tips"]], "Tips and Debugging": [[7, "tips-and-debugging"]], "Training Accuracy Results": [[31, "training-accuracy-results"]], "Training Accuracy on 1-node of 4x Intel Data Center GPU Max 1550": [[31, "training-accuracy-on-1-node-of-4x-intel-data-center-gpu-max-1550"]], "Training Performance Results": [[31, "training-performance-results"]], "Training Performance on 1-node of 4x Intel Data Center GPU Max 1550": [[31, "training-performance-on-1-node-of-4x-intel-data-center-gpu-max-1550"]], "Training Workloads": [[31, "training-workloads"]], "Training the model with Model.fit": [[28, "training-the-model-with-model-fit"]], "Training the model with a custom training loop": [[28, "training-the-model-with-a-custom-training-loop"]], "Troubleshooting": [[14, "troubleshooting"]], "Tune Advanced AMP Manually": [[19, "tune-advanced-amp-manually"]], "Tune Advanced Auto Mixed Precision": [[18, "tune-advanced-auto-mixed-precision"]], "Tuning Performance Example on MobileNet": [[18, "tuning-performance-example-on-mobilenet"]], "Ubuntu Linux Installed in WSL2": [[37, "ubuntu-linux-installed-in-wsl2"]], "Underflow and Overflow": [[28, "underflow-and-overflow"]], "Unit testing": [[7, "unit-testing"]], "Update latest Version": [[5, "update-latest-version"]], "Usage": [[15, "usage"], [17, "usage"], [18, "usage"], [18, "id1"], [19, "usage"], [22, "usage"], [26, "usage"]], "Usage & Effect": [[36, "usage-effect"]], "Usage of Docker Container": [[2, "usage-of-docker-container"]], "Usage of TCMalloc/Jemalloc/Default memory allocator": [[29, "usage-of-tcmalloc-jemalloc-default-memory-allocator"]], "Use Case with different performance": [[27, "use-case-with-different-performance"]], "Using Eigen Thread Pool": [[35, "using-eigen-thread-pool"]], "Using OpenMP Thread Pool": [[35, "using-openmp-thread-pool"]], "V. Throughput mode": [[29, "v-throughput-mode"]], "VI. Latency mode": [[29, "vi-latency-mode"]], "VII. Your designated number of instances": [[29, "vii-your-designated-number-of-instances"]], "VIII. Your designated number of instances and instance index": [[29, "viii-your-designated-number-of-instances-and-instance-index"]], "Verify That Intel GPU is Accessible From TensorFlow": [[2, "verify-that-intel-gpu-is-accessible-from-tensorflow"]], "Verify the Installation": [[41, "verify-the-installation"], [42, "verify-the-installation"]], "Virtual environment install": [[37, "virtual-environment-install"], [41, "virtual-environment-install"], [42, "virtual-environment-install"]], "Welcome to Intel \u00ae Extension for TensorFlow* documentation!": [[6, "welcome-to-intel-extension-for-tensorflow-documentation"], [64, "welcome-to-intel-extension-for-tensorflow-documentation"]], "Welcome to Intel\u00ae Extension for TensorFlow* documentation": [[4, "welcome-to-intel-extension-for-tensorflow-documentation"]], "Why NextPluggableDevice": [[30, "why-nextpluggabledevice"]], "Windows GPU Drivers": [[37, "windows-gpu-drivers"]], "Windows Subsystem for Linux 2 (WSL2)": [[37, "windows-subsystem-for-linux-2-wsl2"], [37, "id1"]], "With XPUAutoShard": [[62, "with-xpuautoshard"]], "Without XPUAutoShard": [[62, "without-xpuautoshard"]], "Workflow": [[10, "workflow"], [15, "workflow"], [17, "workflow"], [36, "workflow"]], "X. Set environment variable TF_NUM_INTEROP_THREADS": [[29, "x-set-environment-variable-tf-num-interop-threads"]], "XPU Engine": [[23, "xpu-engine"]], "XPU for CPU only platform (Deprecated)": [[42, "xpu-for-cpu-only-platform-deprecated"]], "XPUAutoShard on GPU [Experimental]": [[17, "xpuautoshard-on-gpu-experimental"], [21, "xpuautoshard-on-gpu-experimental"]], "bazel style guide": [[7, "bazel-style-guide"]], "itex graph": [[33, "itex-graph"]], "itex operators": [[33, "itex-operators"]], "itex ops override": [[33, "itex-ops-override"]], "itex version": [[33, "itex-version"]], "itex.AutoMixedPrecisionOptions": [[33, "itex-automixedprecisionoptions"]], "itex.ConfigProto": [[33, "itex-configproto"]], "itex.DebugOptions": [[33, "itex-debugoptions"]], "itex.GPUOptions": [[33, "itex-gpuoptions"]], "itex.GraphOptions": [[33, "itex-graphoptions"]], "itex.ShardingConfig": [[33, "itex-shardingconfig"]], "itex.get_config": [[33, "itex-get-config"]], "itex.ops.AdamWithWeightDecayOptimizer": [[25, "itex-ops-adamwithweightdecayoptimizer"]], "itex.ops.GroupNormalization": [[25, "itex-ops-groupnormalization"]], "itex.ops.ItexLSTM": [[25, "itex-ops-itexlstm"]], "itex.ops.LAMBOptimizer": [[25, "itex-ops-lamboptimizer"]], "itex.ops.LayerNormalization": [[25, "itex-ops-layernormalization"]], "itex.ops.gelu": [[25, "itex-ops-gelu"]], "itex.set_config": [[33, "itex-set-config"]], "oneDNN object cache optimization": [[13, "onednn-object-cache-optimization"]], "quick_example.py": [[53, "quick-example-py"]]}, "docnames": ["CODE_OF_CONDUCT", "SECURITY", "docker/README", "docker/tensorflow-serving/README", "docs/README", "docs/build_docs/docs_build_tips", "docs/build_docs/source/index", "docs/community/contributing", "docs/community/releases", "docs/design/directory_structure", "docs/design/extension_design", "docs/design/how_to_write_custom_op", "docs/design/optimization/README", "docs/design/optimization/oneDNN_object_cache", "docs/guide/FAQ", "docs/guide/INT8_quantization", "docs/guide/OpenXLA", "docs/guide/XPUAutoShard", "docs/guide/aamp_tune", "docs/guide/advanced_auto_mixed_precision", "docs/guide/environment_variables", "docs/guide/features", "docs/guide/how_to_enable_profiler", "docs/guide/infrastructure", "docs/guide/itex_fusion", "docs/guide/itex_ops", "docs/guide/itex_ops_override", "docs/guide/keras3_support", "docs/guide/keras_mixed_precision", "docs/guide/launch", "docs/guide/next_pluggable_device", "docs/guide/performance", "docs/guide/practice_guide", "docs/guide/python_api", "docs/guide/tf_serving_install", "docs/guide/threadpool", "docs/guide/weight_prepack", "docs/install/experimental/install_for_arc_gpu", "docs/install/experimental/install_for_gpu_conda", "docs/install/how_to_build", "docs/install/install_for_cpp", "docs/install/install_for_cpu", "docs/install/install_for_xpu", "docs/install/installation_guide", "examples/README", "examples/accelerate_alexnet_by_quantization/README", "examples/common_guide_running", "examples/infer_inception_v4_amp/README", "examples/infer_resnet50/README", "examples/itex_quantization_example/README", "examples/model_zoo_example/README", "examples/pretrain_bert/README", "examples/quantize_inception_v3/README", "examples/quick_example", "examples/stable_diffussion_inference/README", "examples/train_3d_unet/README", "examples/train_bert/README", "examples/train_bert_fp8/README", "examples/train_horovod/mnist/README", "examples/train_horovod/resnet50/README", "examples/train_maskrcnn/README", "examples/train_resnet50/README", "examples/train_resnet50_with_autoshard/README", "get_started", "index"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["CODE_OF_CONDUCT.md", "SECURITY.md", "docker/README.md", "docker/tensorflow-serving/README.md", "docs/README.md", "docs/build_docs/docs_build_tips.md", "docs/build_docs/source/index.rst", "docs/community/contributing.md", "docs/community/releases.md", "docs/design/directory_structure.md", "docs/design/extension_design.md", "docs/design/how_to_write_custom_op.md", "docs/design/optimization/README.md", "docs/design/optimization/oneDNN_object_cache.md", "docs/guide/FAQ.md", "docs/guide/INT8_quantization.md", "docs/guide/OpenXLA.md", "docs/guide/XPUAutoShard.md", "docs/guide/aamp_tune.md", "docs/guide/advanced_auto_mixed_precision.md", "docs/guide/environment_variables.md", "docs/guide/features.rst", "docs/guide/how_to_enable_profiler.md", "docs/guide/infrastructure.md", "docs/guide/itex_fusion.md", "docs/guide/itex_ops.md", "docs/guide/itex_ops_override.md", "docs/guide/keras3_support.md", "docs/guide/keras_mixed_precision.md", "docs/guide/launch.md", "docs/guide/next_pluggable_device.md", "docs/guide/performance.md", "docs/guide/practice_guide.md", "docs/guide/python_api.md", "docs/guide/tf_serving_install.md", "docs/guide/threadpool.md", "docs/guide/weight_prepack.md", "docs/install/experimental/install_for_arc_gpu.md", "docs/install/experimental/install_for_gpu_conda.md", "docs/install/how_to_build.md", "docs/install/install_for_cpp.md", "docs/install/install_for_cpu.md", "docs/install/install_for_xpu.md", "docs/install/installation_guide.rst", "examples/README.md", "examples/accelerate_alexnet_by_quantization/README.md", "examples/common_guide_running.md", "examples/infer_inception_v4_amp/README.md", "examples/infer_resnet50/README.md", "examples/itex_quantization_example/README.md", "examples/model_zoo_example/README.md", "examples/pretrain_bert/README.md", "examples/quantize_inception_v3/README.md", "examples/quick_example.md", "examples/stable_diffussion_inference/README.md", "examples/train_3d_unet/README.md", "examples/train_bert/README.md", "examples/train_bert_fp8/README.md", "examples/train_horovod/mnist/README.md", "examples/train_horovod/resnet50/README.md", "examples/train_maskrcnn/README.md", "examples/train_resnet50/README.md", "examples/train_resnet50_with_autoshard/README.md", "get_started.md", "index.rst"], "indexentries": {}, "objects": {}, "objnames": {}, "objtypes": {}, "terms": {"": [0, 4, 5, 14, 16, 18, 20, 21, 28, 31, 32, 34, 35, 39, 40, 45, 47, 49, 51, 52, 54, 55, 56, 63], "0": [2, 3, 4, 5, 11, 14, 15, 16, 19, 20, 22, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 45, 48, 49, 51, 52, 53, 56, 57, 58, 60, 61, 62, 63], "00": [16, 31, 42, 49, 61], "000": 28, "000000e": 51, "0001": 49, "0005": 51, "000611": 51, "001": [25, 26], "00363725": 25, "004": 51, "00404969": 25, "004888": 51, "006297": 61, "006950": 58, "00x": 31, "01": [14, 16, 26, 31, 33, 49, 61], "0113076031208038": 47, "01837550401687622": 47, "02": [16, 26, 28, 31, 61], "025180": 62, "027671": 62, "03": [29, 31, 51, 61], "037595": 51, "04": [2, 16, 31, 34, 35, 37, 39, 41, 42, 49, 56], "05": [16, 29, 31, 58], "0527704": 53, "06": [14, 16, 25, 28, 51], "061277": 28, "061301": 28, "061306": 28, "063685": 28, "063851": 28, "063865": 28, "0656753": 53, "07": [14, 16, 25, 31, 42, 61, 62], "072701": 51, "072752": 51, "072779": 51, "072805": 51, "072829": 51, "072861": 51, "072884": 51, "072928": 51, "073072": 51, "073094": 51, "073121": 51, "073183": 51, "077278": 53, "08": [16, 29, 35, 61], "089": 29, "09": [16, 29, 61], "090": 29, "0f": 11, "1": [2, 4, 5, 14, 16, 18, 19, 20, 21, 22, 25, 26, 27, 28, 29, 30, 32, 33, 35, 36, 38, 39, 42, 47, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "10": [2, 14, 16, 18, 19, 25, 28, 29, 35, 36, 37, 39, 40, 41, 49, 51, 52, 61, 62, 63], "100": [11, 28, 33, 39, 51], "1000": [31, 34, 55, 61], "10000": [19, 25, 28], "101": 37, "1024": [28, 31], "1024_a": 51, "1024gb": 31, "103148": 62, "105446": 51, "107809": 58, "10gbase": 31, "11": [16, 18, 29, 31, 37, 38, 39, 40, 42, 61, 63], "111": [28, 32], "112": 32, "114": [28, 58], "1146879196167": 54, "11490434": 28, "116": 14, "118": [28, 30], "118212": 53, "1193419": 53, "12": [7, 14, 16, 28, 29, 31, 42, 51, 54, 56, 58, 61, 62, 63], "1200": 61, "122": 33, "122414": 51, "122509": 51, "12278": 31, "127": [5, 34], "128": [16, 31, 47, 51, 57], "128gb": 31, "129": 29, "12_h": 51, "12e": 51, "13": [16, 40, 52, 58, 62, 63], "133": 49, "136": 29, "137": 29, "139660941027136": 61, "139898862851904": 61, "14": [28, 31, 34, 40, 49, 51, 56, 58, 61, 63], "140": [39, 40], "140348344015936": 62, "1403804": 53, "140612319840064": 61, "141": 11, "144": 29, "1445": 11, "145": [29, 61, 62], "1455178": 53, "15": [2, 7, 16, 29, 31, 35, 37, 38, 39, 40, 41, 42, 45, 51, 63], "150": 55, "15000": 25, "15031084974591766410": 2, "150400": 31, "150w": 31, "1550": 16, "156": 28, "15865526": 25, "158808": 25, "16": [18, 28, 29, 31, 33, 41, 47, 51, 61], "161625": 62, "163": 49, "163161": 58, "163517": 58, "163815": 62, "1657011814330": 18, "1657011815538": 18, "1658201": 53, "1666": 51, "1691980294577": 47, "16x64gb": 31, "17": [29, 40], "170": [39, 40, 42, 54, 57], "1704025": 53, "170intel": 47, "1729176": 53, "174": 56, "17448926295332318308": 2, "1762": 31, "1766": 31, "177216": 51, "178206": 61, "18": [16, 51, 58], "182": 31, "1846": 51, "185w": 31, "19": [29, 31, 37, 41, 42], "1900": 61, "190052": 51, "190136": 51, "190169": 51, "190193": 51, "190217": 51, "190249": 51, "190273": 51, "190343": 51, "190536": 51, "190559": 51, "190587": 51, "190668": 51, "191": 29, "192": [29, 51], "197306": 53, "198": 29, "1986": 28, "1997": 25, "1a": 40, "1ccb4fee": 38, "1e": [25, 26, 28], "1export": [18, 19], "1tb": 31, "1u": 28, "2": [2, 14, 15, 16, 17, 18, 19, 20, 24, 25, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 41, 42, 45, 47, 48, 49, 51, 52, 53, 54, 55, 57, 58, 60, 61, 62, 63], "20": [16, 29, 31, 35, 39, 41, 60, 62], "200": [25, 26, 51], "2000": [51, 61], "200m": 32, "2016": 25, "2017": [31, 60], "2018": 49, "20180905": 33, "2019": 55, "20200711": 49, "2021": 14, "2022": [28, 29, 33], "2023": [38, 42, 49, 51, 58], "20230123": 21, "2024": [14, 31, 37, 42], "206": 29, "207": 29, "21": [29, 31, 51], "210": 49, "2100": 61, "2134862": 53, "215": 29, "2155": 28, "216": 29, "217981": 42, "22": [2, 31, 34, 37, 39, 41, 42, 49, 51, 62], "2200": 61, "22355853": 48, "224": [22, 49], "22471978829632": 51, "224x224": 31, "227250": 51, "229": 29, "23": [29, 31, 42, 62], "2300": 61, "23092487755584": 51, "23450678511424": 51, "2350": 37, "24": [29, 31, 51, 58], "2400": 61, "241": 29, "2488174077578": 57, "24_h": 51, "24x": 31, "25": [31, 62], "250": 58, "250221": 53, "25294047594070435": 28, "254": 29, "255": [19, 28, 35], "256": [28, 31, 35, 51, 62], "26": 35, "2600": 51, "2607155": 53, "2636094": 53, "26531240344047546": 28, "266": 29, "268435456": 2, "269": 28, "27": [16, 29, 32, 62], "272": 30, "27642": 42, "277716": 61, "277811": 61, "278": 29, "28": [29, 31, 32, 38, 42, 49, 51], "280": 62, "29": [29, 31], "290": 29, "298973": 53, "299": 35, "2nd": 41, "2tb": 31, "2x": [31, 35], "2x256x10": 62, "3": [2, 4, 7, 16, 18, 20, 22, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 38, 39, 40, 41, 42, 45, 46, 49, 52, 53, 62], "30": [14, 16, 31, 35, 49, 51, 62], "3000765": 53, "3007": 31, "300x300": [31, 49], "302": 29, "303": 28, "305706": 53, "31": [29, 37], "312": [31, 51], "314010": 51, "314064": 51, "314090": 51, "314113": 51, "314135": 51, "314165": 51, "314197": 51, "314260": 51, "314455": 51, "314478": 51, "314505": 51, "314589": 51, "315": 29, "318963": 53, "32": [16, 18, 25, 26, 28, 29, 31, 33, 47, 51, 57, 61], "3200": 31, "3221133": 53, "3265": 31, "327": 29, "327398": 53, "328223477737884": 54, "33": 14, "3343554": 62, "3359": 28, "3359284": 62, "3364005982875824": 28, "339": 29, "3391027": 53, "34": 29, "3455": 28, "3461": 31, "35": [29, 31, 42], "350w": 31, "351": 29, "3549364": 53, "3555": 28, "3587": 31, "36": [29, 31, 35, 49], "364": 29, "3670": 28, "37": 16, "3753": 28, "376": 29, "3787665": 53, "38": [29, 31], "3804817": 53, "381424": 53, "384": 31, "3870": 31, "388": 29, "39": [29, 31], "3905785": 53, "3999124": 53, "3d": 44, "3dunet_itex": 55, "3dunet_itex_with_horovod": 55, "3e": [51, 57], "3f": 35, "3rd": [4, 21, 31, 41], "4": [14, 17, 18, 20, 24, 25, 28, 29, 30, 32, 35, 38, 51, 53, 58, 60, 62], "40": [14, 16, 29, 31, 42, 51], "400": [29, 61], "404": 29, "405": 29, "408512": 61, "4096": [19, 28], "40ghz": 31, "41": [16, 28], "41249612335034": 57, "413": 29, "416651": 62, "419072": 62, "42": 31, "42261": 53, "425": 29, "43": [16, 29, 31, 42], "435": 31, "438": 29, "44": [11, 16, 29], "4498": 28, "452": 29, "45x": 31, "461180928": 51, "465": 29, "47": [16, 29, 61], "4718971": 53, "479": 62, "479142": 53, "47eb": [37, 42], "48": [16, 29, 51, 61], "480": 29, "4800": 31, "481086": 53, "4818356": 53, "49": [29, 61], "4929404": 53, "494": 29, "4d": 25, "4th": [31, 41, 47], "5": [11, 18, 19, 20, 22, 25, 28, 30, 33, 35, 39, 40, 41, 51, 53, 57, 62], "50": [29, 31, 35], "5000": 31, "5063303": 53, "509": 29, "50ghz": 32, "51": [16, 29, 31, 51], "510076": 14, "51179520": 51, "512": [31, 51, 57], "5120": 62, "512x512": 31, "517385": 53, "52": [16, 28, 29, 51], "523": 31, "5294489860534668": 28, "53": [29, 31], "5300783": 53, "5333": 37, "54": 58, "5479512": 53, "549": 29, "55": [14, 16, 29, 31, 32, 35, 62], "550": 29, "555174": 61, "555221": 61, "5597944": 53, "56": [16, 29, 31, 32, 35], "57": 31, "5774": 51, "57x": 31, "58": 29, "586": 29, "59": [16, 29], "590331": 61, "594147": 62, "595": 51, "596": [37, 42, 51], "597": 51, "597360": 62, "598": 51, "5e": 51, "5th": 31, "6": [18, 26, 28, 30, 31, 33, 42, 49, 51], "60": [28, 29, 31, 35, 51], "600": [51, 61], "60000": [19, 28], "600w": 31, "601": 51, "602": 51, "6027272": 53, "602742": 61, "603262": 61, "604": [29, 51], "6047": 31, "605": 29, "606": 51, "607": 51, "6153628825864496": 47, "6240": 28, "63": [16, 29], "6336y": 31, "6342418": 53, "634554": 62, "64": [14, 16, 17, 19, 28, 29, 31, 35, 37, 39, 41, 42, 51, 56], "640x640": 49, "6416": 51, "6422923": 53, "6456823": 53, "6461415": 53, "6514435": 53, "65504": 28, "6628485": 53, "66fa74b6a2a0bb1e563ae8bce66496b118b95200": 54, "67": [16, 29, 31], "6761076": 53, "68": 29, "6867": 31, "69": 31, "692": 31, "6926193": 53, "693": 29, "694": 29, "69612": 49, "699": 31, "7": [18, 28, 29, 30, 31, 33, 49, 51, 54], "7090344": 53, "71": 29, "7112d33": 33, "718459": 53, "72": [29, 49], "7239000201225281": 28, "7296917": 53, "7297122": 53, "730m": 14, "736": 31, "74": 31, "7494": 28, "75": [29, 31], "7520": 28, "757": 29, "76": [25, 29, 31, 51], "768": 51, "768_a": 51, "772": 29, "773": 11, "7787259": 53, "784": [19, 28, 29, 35], "79": 29, "790128": 61, "790632": 62, "792936": 62, "795": 29, "7987": 28, "7f": 51, "8": [18, 25, 28, 29, 31, 33, 40, 41, 42, 49, 51, 52], "80": [29, 31], "800": 61, "803": [37, 42], "806": 29, "81": [31, 51, 54, 57], "810": 51, "817": 29, "8180m": 32, "8192": [19, 28], "81m": 28, "82574l": 31, "828": 29, "83": [29, 31, 32, 51], "839": 29, "83m": 28, "84": [29, 31, 32], "841192": 25, "8413447": 25, "8480": [31, 35], "84m": 28, "85": 35, "850": 29, "8500": [3, 34], "8501": 34, "8534": 28, "85485": 53, "8598063": 53, "85m": 28, "86": [16, 31], "8672705": 53, "867908472383153": 47, "87": [29, 31], "870": 31, "875052": 53, "8751": 28, "88": [29, 57], "8809638": 53, "8819": 28, "8863": 28, "8876": [37, 42], "888000e": 51, "8880196": 53, "8888": [41, 42, 47, 52, 54, 56], "88eb3cff2f03dad85035621d041e23a14345999": 55, "891": 29, "892": 29, "8941312": 53, "8972": 28, "89942324": 53, "8x16gb": 31, "9": [14, 18, 25, 26, 29, 30, 37, 38, 39, 41, 42, 45, 46, 56, 62], "9000": 5, "908": 29, "909": 29, "91": [29, 31], "911": 29, "9154005": 53, "9168000221252441": 28, "917546": 61, "917738": 61, "918": 31, "92": [29, 31], "924008369445801": 28, "9259825": 53, "9260886": 53, "9266936945121049176": 2, "928": 31, "92880015134813": 47, "92x": 31, "93": 31, "930": 29, "9349675": 53, "9373732": 53, "9377": 28, "9381000399589539": 28, "9381838": 53, "93901324": 53, "94": 16, "940695": 58, "9410": 28, "947": 29, "948": 29, "9486000537872314": 28, "949225": 53, "95": [29, 31], "951": 29, "9536000490188599": 28, "96": [29, 31, 40, 51], "9631021": 53, "9677248": 53, "968": 31, "96x": 31, "97": 16, "9702091": 53, "9746864": 53, "9755": 28, "98": 16, "9842": 31, "9873173": 53, "988714": 53, "99": 16, "9959502": 25, "9963627": 25, "999": [25, 26], "99998": 25, "A": [0, 5, 17, 18, 24, 28, 29, 32, 33, 34, 36, 42, 44, 47, 58], "And": [30, 37, 41, 42, 51], "As": [17, 24, 28, 29, 32], "At": [16, 17, 21, 45, 54], "Being": 0, "But": [27, 28], "By": [13, 20, 28, 29, 32, 52], "For": [0, 1, 2, 4, 7, 11, 14, 15, 18, 19, 20, 23, 25, 26, 28, 29, 31, 33, 34, 35, 37, 42, 47, 48, 49, 50, 51, 54, 55, 56, 57, 58, 60, 61, 62], "If": [2, 3, 5, 20, 22, 25, 26, 27, 28, 29, 32, 33, 35, 37, 39, 40, 41, 42, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 60], "In": [4, 11, 16, 18, 19, 27, 28, 29, 30, 32, 35, 36, 38, 45, 47, 49, 52, 53, 58, 62], "It": [4, 11, 14, 15, 16, 17, 18, 19, 20, 21, 28, 30, 32, 35, 36, 38, 39, 44, 51, 52, 55, 56, 60, 63], "NOT": [7, 14], "No": [0, 14, 19, 22, 35, 39, 47, 48, 51, 54, 55, 56, 57, 60], "Not": 20, "ON": [17, 31, 33, 47, 62], "Of": 51, "On": [28, 32, 37, 41, 42], "One": [29, 32], "That": [14, 32, 39, 40, 47], "The": [0, 2, 4, 5, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 45, 47, 49, 51, 52, 55, 56, 57, 58, 60, 61, 62], "Their": 28, "Then": [3, 11, 22, 33, 41, 42, 52], "There": [21, 27, 36, 39, 45, 47, 52, 61], "These": [16, 24, 28, 29, 63], "To": [2, 3, 4, 7, 16, 18, 19, 24, 27, 28, 32, 36, 37, 39, 40, 41, 42, 45, 51, 52, 54, 55, 60], "With": [18, 19, 28, 29, 30, 45, 48, 53, 54], "_": [0, 11, 13, 14, 17, 18, 20, 22, 24, 27, 28, 29, 30, 32, 33, 34, 35, 37, 39, 40, 46, 47, 49, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61], "__del__": 56, "__init__": 35, "__main__": [29, 35], "__name__": 35, "__version__": [11, 33, 37, 39, 40, 41, 42, 63], "_gbs1_": 51, "_gbs2_": 51, "_pywrap_itex": 39, "_timestamp_inst": 29, "_timestamp_instance_n_cor": 29, "a100": 54, "a380": [39, 40], "a730m": [39, 40], "a930253": 33, "abl": 5, "about": [0, 7, 19, 32, 34, 35, 45, 51, 52, 58], "abov": [18, 19, 22, 28, 29, 32, 37, 47, 51, 52, 55, 56, 57, 58, 60, 62], "absolut": [29, 51], "abus": 0, "acceler": [4, 14, 16, 30, 31, 33, 44, 47, 52, 63], "accept": [0, 7, 17], "access": 37, "accmatmul": 24, "accord": [17, 18, 47, 56, 58, 61], "accordingli": 62, "account": 0, "accumul": 31, "accur": 36, "accuraci": [15, 18, 19, 25, 28, 44, 45, 52, 58, 61], "achiev": [18, 32], "acm": [39, 40], "across": [16, 20, 25], "act": [0, 21, 34], "action": [0, 5, 36], "activ": [11, 18, 19, 22, 25, 28, 32, 33, 37, 38, 39, 40, 41, 42, 46, 47, 48, 52, 53, 55, 56, 58, 60], "ad": [5, 13, 17, 18, 21, 23, 28, 39, 51, 62], "adam": 25, "adamw": 25, "adamwithweightdecayoptim": 26, "adapt": 0, "add": [3, 4, 5, 17, 18, 19, 24, 27, 32, 34, 37, 39, 40, 47, 54, 62], "add_weight": 35, "add_with_xla": 30, "addit": [8, 21, 23, 24, 32, 36, 40, 63], "addition": [18, 28], "addn": 24, "addon": [26, 58], "address": [0, 32, 37], "adher": 63, "adjust": [20, 25, 51], "adjusted_init_lr": 51, "adopt": [4, 15, 16, 21], "advanc": [0, 4, 20, 30, 33, 44, 63], "affect": [0, 18, 28], "affin": 32, "after": [2, 17, 18, 19, 22, 24, 26, 27, 28, 32, 33, 36, 37, 38, 42, 45, 51, 56], "afterward": [28, 29, 32], "ag": 0, "again": 28, "against": 7, "agent": 37, "aggress": [0, 16, 18, 19], "ahead": [39, 40], "ai": [44, 45, 50, 52, 63], "aim": 63, "aka": 21, "akdlm": [37, 42], "al": 25, "alexnet": 44, "alg": 11, "alg_kind_": 11, "algebra": [4, 16, 30], "algo": 11, "algorithm": [11, 25], "align": [0, 13], "all": [0, 7, 11, 14, 18, 20, 21, 25, 27, 28, 30, 32, 37, 42, 45, 47, 51, 62], "allocate_output": 11, "allow": [0, 16, 18, 28, 32, 35, 56, 63], "allowlist": 18, "allowlist_add": [18, 19], "allowlist_remov": 18, "almost": 21, "along": [30, 32], "alpha": 11, "alpha_": 11, "alreadi": [18, 28, 38, 45], "also": [0, 4, 7, 15, 16, 17, 19, 21, 23, 27, 28, 29, 30, 32, 36, 37, 38, 41, 42, 63], "altern": 18, "although": 32, "alwai": [18, 28, 36], "alwayslink": [11, 34], "am": 51, "amd64": [7, 37], "among": [29, 32], "amount": [14, 28], "amp": [4, 18, 29, 31, 44, 55, 60, 63], "ampthre": 18, "amx": 52, "amx_bf16": 52, "amx_int8": 52, "an": [0, 2, 3, 4, 7, 11, 13, 14, 16, 18, 19, 21, 24, 25, 27, 28, 29, 30, 32, 34, 35, 37, 38, 39, 40, 42, 44, 49, 52, 53, 57, 62, 63], "anaconda": 38, "analysi": [16, 32], "analyt": 45, "analyz": [16, 22], "ani": [0, 4, 11, 16, 20, 21, 23, 24, 27, 28, 29, 37, 38, 39, 42, 45, 53, 56], "annot": 17, "anoth": [29, 32, 36], "answer": 0, "antirectifi": 35, "aot": [39, 40], "apach": 63, "api": [4, 7, 9, 10, 14, 15, 16, 19, 25, 26, 27, 28, 30, 32, 34, 40, 52, 53], "apolog": 0, "apologi": 0, "appear": [0, 28], "append": [35, 37, 41, 42], "appli": [0, 16, 17, 25, 28, 33, 34, 51, 54, 55, 57, 60, 62], "applic": [4, 21, 23, 31, 32, 33, 34, 36, 45], "apply_gradi": 28, "appoint": 0, "approach": [4, 16, 38], "appropri": [0, 3, 32, 39, 40], "approv": 7, "approxim": [11, 25], "approximate_": 11, "apt": [7, 34, 37, 39, 42], "ar": [0, 2, 4, 5, 7, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 34, 36, 37, 39, 40, 41, 42, 44, 45, 47, 51, 52, 53, 55, 58, 61, 63], "arang": 25, "arc": [14, 39, 40, 42, 47, 63], "arch": 37, "architectur": [11, 16], "archiv": 37, "area": 13, "arg": [2, 13, 33], "argument": [13, 25, 28, 29, 33], "around": [0, 29, 51], "arrai": 25, "articl": 32, "as_graph_el": 35, "ask": [4, 36, 39, 40], "aspect": 28, "assign": [29, 32, 40], "assign_i": 40, "assign_x": 40, "assist": 8, "assum": [17, 28, 32, 38, 39, 40, 51, 55, 60], "assumpt": [2, 3], "astyp": [19, 28, 35, 53], "ats": [39, 40], "atsp": 28, "attach": [2, 3, 28, 32], "attack": 0, "attent": [0, 20], "attr": [11, 20], "attribut": [24, 33], "auto": [4, 11, 17, 27, 29, 30, 33, 40], "auto_mixed_precis": [18, 19, 33, 47], "auto_mixed_precision_log_path": [20, 33], "auto_mixed_precision_opt": [18, 19, 47], "auto_mixed_precision_optionsgraph_opt": 18, "auto_mod": [17, 62], "auto_sharding_pass": 17, "auto_sharding_pass_mlir": 17, "autom": [21, 29], "automat": [4, 5, 16, 17, 18, 19, 21, 26, 28, 29, 31, 32, 33, 37, 42, 44, 48, 53, 62], "automixedprecis": 18, "automixedprecisionopt": [18, 19, 47], "automixedprecosionopt": 18, "autoshard": [17, 62], "ava": 49, "avail": [0, 2, 3, 11, 14, 19, 25, 29, 32, 35, 36, 39, 40, 41, 42, 55], "averag": 51, "avgpool": [18, 19, 49], "avgpool3d": [18, 19], "avoid": [0, 4, 24, 27, 28, 29, 32, 35, 38, 51], "avx512": [4, 21, 52], "avx_vnni": 52, "awk": 51, "axi": [25, 26, 35], "b": [30, 35, 40, 47, 49, 51, 52, 61, 62], "b4ab4b8f8b3a41fade4899fd00b5b2d2dad0981f3e1bb10df4c522975fd7": 40, "b7a8": [37, 42], "ba": 25, "back": [17, 28, 39], "backend": [4, 16, 21, 23, 26, 27, 28, 33, 42, 47, 48, 52, 53, 63], "background": 32, "background_thread": 29, "backward": [11, 28], "balanc": [18, 19, 31, 35], "bare": 44, "base": [7, 11, 14, 15, 16, 18, 19, 25, 31, 32, 37, 38, 41, 44, 47, 51, 52, 57, 58, 62, 63], "base_config": 35, "base_shap": 35, "basekit": [37, 38, 42], "bash": [2, 37, 38, 39, 40, 47, 51, 52, 60, 63], "bashrc": 38, "basi": 37, "basic": [18, 19, 20, 28], "batch": [17, 25, 28, 29, 31, 51, 62], "batch_siz": [16, 17, 19, 28, 35, 55, 62], "batch_size_per_gpu": 51, "batchmatmul": [24, 26], "bazel": [3, 11, 34], "bazelbuild": [7, 39, 40], "bazelrc": 39, "becaus": [18, 19, 28, 36], "becom": [13, 32, 36], "been": [28, 32, 54, 62], "befor": [5, 7, 11, 16, 18, 19, 24, 27, 28, 29, 32, 35, 36, 39, 40, 44, 62], "begin": [7, 11, 47], "behavior": [0, 27, 28, 29, 32, 36, 51], "being": 32, "below": [2, 3, 24, 25, 28, 29, 30, 31, 32, 33, 37, 39, 42, 51, 56], "benchmark": [7, 16, 31, 35, 55, 61], "benefit": [4, 21, 28, 32, 33], "bert": [16, 20, 25, 36, 44], "bert_base_dir": 16, "bert_base_model": 16, "bert_config": [16, 57], "bert_config_fil": [16, 57], "bert_larg": 16, "bert_large_dir": 57, "bert_model": [51, 57], "bert_prep_working_dir": 51, "besid": [21, 32], "best": [0, 14, 16, 27, 37], "beta": 11, "beta_": 11, "beta_1": [25, 26], "beta_2": [25, 26], "beta_constraint": [25, 26], "beta_initi": [25, 26], "beta_regular": [25, 26], "better": [4, 15, 16, 18, 19, 21, 24, 25, 27, 29, 32, 35, 36, 44, 51, 52, 54, 55, 60], "between": [16, 17, 18, 19, 21, 32, 34, 35, 39, 54, 61, 62], "bf16": [18, 19, 24, 31, 44, 45, 47, 51, 55, 60, 61, 62], "bf32": 20, "bfloat16": [4, 11, 18, 19, 21, 24, 28, 33, 47, 51, 55, 57, 60], "bfloat16graph_opt": 19, "bia": [13, 20, 24, 53], "bias_add": 53, "bias_initi": [25, 26], "biasadd": [20, 26], "biasaddgrad": 24, "big": 45, "bin": [3, 7, 11, 29, 34, 39, 40, 46, 47, 48, 52, 55, 56, 58, 60], "bin_threadpool": 3, "binari": [18, 34, 39, 40], "bind": [13, 30, 32, 40], "bind_al": 22, "bit": [15, 18, 28, 33, 37, 39, 41, 42, 47], "blob": [21, 34], "block": [11, 32, 33, 35, 36, 42], "blocker": 45, "blocktim": 32, "blog": 16, "board": 31, "bodi": 0, "bookcorpu": [31, 51], "bool": 11, "boolean": [24, 29], "boost": [4, 21, 29, 31, 32], "both": [4, 7, 14, 15, 18, 19, 23, 27, 29, 30, 31, 32, 33, 39, 47, 61], "bound": 32, "box": 15, "brain": 55, "branch": [5, 7, 39], "break": 24, "bridg": [21, 34], "briefli": 32, "bring": [23, 28, 29, 63], "browser": [5, 22, 41, 42, 49, 52, 54, 56], "bs1": 49, "bt": 35, "bu": [2, 30], "buffer": [16, 49], "bug": [7, 63], "buid": 40, "build": [4, 7, 9, 35, 43, 44, 45, 51, 63], "build_doc": 5, "build_pip_packag": [11, 39], "build_tmp": 5, "build_with_threadpool": 40, "builder": 61, "buildifi": 7, "buildtool": 7, "built": [11, 16, 34, 41, 42], "bus_id": 2, "busi": 32, "bzl": 7, "c": [2, 4, 10, 11, 14, 29, 30, 32, 35, 37, 38, 39, 41, 42, 43, 56, 63], "c481324031ecf0f70f8939516c02e16cac60446d": 60, "c_api_experiment": 40, "c_str": 40, "cach": [12, 15, 32, 35, 51], "calcul": [29, 54], "calibr": 52, "call": [11, 15, 16, 26, 28, 30, 32, 33, 35, 36, 43, 46, 52, 53, 56, 57], "callabl": 56, "can": [2, 3, 4, 7, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 23, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 45, 51, 55, 56, 60, 61, 62, 63], "cannot": [14, 18, 27, 35, 47, 48, 51, 54, 55, 57, 60], "capabl": [4, 14, 27, 28], "capi": 30, "card": [20, 51, 58], "case": [4, 13, 18, 19, 21, 28, 29, 32, 35, 47], "cast": [0, 18, 24, 28, 49], "cat": 29, "catch": 11, "caus": [27, 28, 32, 35, 56], "cbica": 55, "cc": [3, 11, 14, 17, 28, 30, 34, 42, 58, 62], "ccl": [38, 42], "cd": [2, 5, 7, 16, 32, 34, 39, 40, 47, 51, 54, 55, 57, 58, 60, 62], "cell": [28, 54], "center": [1, 4, 16, 21, 25, 26, 33, 39, 40, 42, 45, 47, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "cento": 41, "certain": [16, 29, 32], "challeng": 55, "chanc": [18, 28], "chang": [4, 5, 7, 11, 18, 19, 20, 21, 23, 27, 28, 29, 30, 36, 38, 44, 45, 56, 58], "channel": [0, 24, 25, 43], "channels_last": 62, "characterist": 0, "cheap": 35, "check": [5, 7, 11, 13, 14, 18, 19, 21, 23, 28, 29, 37, 38, 39, 40, 45, 46, 47, 57, 63], "checker": 32, "checkout": [5, 34, 40, 55, 60, 62], "checkpoint": 51, "choos": [16, 23, 25, 27, 28, 29, 32, 35, 39, 40, 43, 47, 49, 52, 53, 55], "chrome": 5, "circular": 27, "ckpt": [51, 57], "clang": 7, "clarifi": 0, "clariti": 0, "class": [0, 11, 28, 33, 35], "classic": 32, "classif": 22, "classifi": [44, 61], "classifier_train": 61, "classify_text_with_bert": 56, "claus": [4, 21, 23], "clean": [11, 40], "clearlist": 18, "clearlist_add": 18, "clearlist_remov": 18, "click": [11, 39, 40], "client": [2, 30, 40], "client_sess": 40, "clientsess": 40, "clock": 14, "clone": [5, 16, 34, 39, 40, 51, 54, 55, 57, 60, 61, 62], "close": [25, 27, 32], "closer": 24, "cluster": [27, 38], "cm": 37, "cmake": 39, "cnn": [18, 31, 32, 44, 45], "co": [4, 14, 15, 21], "coco": [31, 49, 60], "coco17": 49, "code": [2, 4, 5, 9, 11, 16, 20, 21, 22, 23, 27, 30, 31, 32, 34, 35, 43, 44, 45, 47, 49, 52], "codebas": [4, 30], "codenam": 4, "colab": 28, "collabor": [16, 63], "collect": [2, 32, 42], "color": 0, "com": [0, 5, 7, 8, 16, 21, 28, 32, 34, 35, 37, 38, 39, 40, 42, 45, 47, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "combin": [16, 21, 29, 32, 54], "come": 4, "comma": 32, "command": [2, 3, 14, 22, 29, 32, 37, 38, 39, 40, 41, 42, 46, 47, 49, 52, 57], "comment": [0, 7, 14], "commit": [0, 5, 17, 34], "common": [0, 11, 14, 17, 21, 32, 44, 51], "common_runtim": [11, 30], "commonli": 32, "commun": [0, 2, 7, 9, 21, 23, 32, 42, 63], "compact": [29, 32, 35], "compar": [16, 18, 28, 32, 44], "compat": [2, 3, 4, 15, 19, 21, 23, 26, 28, 30, 33, 35, 51, 52, 54, 55, 56, 57, 60, 61], "compet": 32, "competit": 32, "compil": [4, 11, 14, 16, 19, 21, 27, 28, 30, 32, 33, 34, 35, 36, 37, 38, 40, 42], "compiler_vers": 33, "complaint": 0, "complet": 32, "complic": [21, 29], "compon": [17, 19, 31, 33, 37, 38, 39, 40, 42], "compos": 17, "compressor": [4, 15, 21, 44, 45, 52], "comput": [4, 11, 15, 16, 25, 28, 32, 35, 37, 45, 53, 54, 63], "compute_dtyp": 28, "compute_gradi": 28, "concat": 35, "concaten": [35, 54], "concatv2": 49, "concept": [16, 28, 32], "concrete_funct": 35, "concurr": [4, 13, 20, 32, 35], "conda": [4, 14, 43, 51, 56], "conda_prefix": 29, "conduct": [7, 29], "conduit": [4, 30], "conf": 29, "config": [11, 14, 17, 18, 19, 28, 34, 35, 37, 39, 40, 42, 47, 52, 58, 61, 62], "config_fil": 61, "configproto": [17, 18, 19, 47, 52, 62], "configur": [4, 8, 11, 14, 17, 19, 21, 23, 28, 29, 33, 35, 37, 42, 49, 61, 63], "confirm": [29, 39, 40], "conflict": 35, "conform": 7, "connect": 32, "consecut": 32, "consequ": 0, "consid": [0, 18, 58], "consist": [7, 28], "consol": 42, "const": 40, "constant": [11, 15, 16, 25, 26, 28, 30], "constant_fold": 52, "constraint": 25, "construct": [0, 11, 17, 28], "constructor": 28, "consum": 51, "consumpt": [19, 21, 28, 47], "contact": 8, "contain": [5, 9, 15, 17, 27, 29, 32, 34, 43, 44, 55, 60, 63], "content": [5, 40, 42], "context": [11, 25, 32], "contigu": 32, "continu": [0, 14, 18, 27, 28], "contrast": 16, "contribut": [0, 4, 14, 21, 29, 39], "contributor": [7, 63], "control": [31, 32, 44, 52, 62], "conv": [17, 24, 53], "conv2d": [4, 21, 49, 53], "conv3d": 24, "convent": 7, "convers": [17, 18, 19, 24], "convert": [15, 16, 17, 18, 19, 28, 36, 45, 47, 49, 55, 61], "convert_to_tensor": 11, "convgradfilt": 24, "convolut": 32, "cooper": [4, 21, 44, 49, 52], "copi": [2, 3, 40], "copt": [11, 34], "copyright": 7, "core": [9, 11, 14, 17, 26, 28, 30, 31, 32, 35, 39, 40, 42, 52, 53, 58, 62], "core_id": 29, "core_list": 29, "correct": [28, 35, 39, 40], "correspond": [18, 29, 30, 36], "correspondli": 61, "cost": 15, "costli": 32, "could": [0, 18, 28, 33, 40, 45, 51, 52], "count": 14, "coupl": 32, "coven": [7, 63], "cover": [19, 21, 24, 29, 32], "cp": [3, 40, 51], "cp311": 40, "cpp": [3, 14, 17, 37], "cpplint": 7, "cpu": [2, 3, 4, 9, 11, 14, 15, 16, 18, 19, 20, 23, 24, 28, 31, 33, 34, 36, 43, 44, 45, 49], "cpudevic": 11, "cpunodebind": 32, "crash": 56, "creat": [11, 18, 28, 29, 30, 33, 36, 38, 42, 46, 49, 52, 55, 60, 62], "create_datasets_from_start": 51, "creatednnlengin": 11, "creatednnlstream": 11, "creation": 13, "critic": 18, "cross": [29, 32], "ctl": 61, "ctx": 11, "cuda": 28, "cuda_diagnost": 28, "cuda_driv": 28, "cuinit": 28, "curl": 38, "current": [14, 17, 22, 33, 51, 55, 60, 62], "custom": [4, 7, 9, 16, 18, 21, 26, 27, 29, 33, 37, 42, 51], "custom_graph_optimizer_registri": 58, "cv": 54, "cvfh": 3, "d": [7, 35, 37, 39, 40, 61], "d50dnp1sbb": 31, "dai": 51, "danger": 18, "dashboard": 22, "data": [4, 15, 16, 17, 18, 21, 22, 25, 28, 33, 35, 39, 40, 42, 45, 47, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "data_dir": [16, 51, 55, 60, 61], "data_f32": 11, "data_format": [20, 62], "data_typ": [18, 19, 47], "dataset": [19, 28, 31, 35, 52, 58], "dataset_dir": [55, 60], "datatyp": [33, 40, 51, 55, 60], "dch": 37, "dcmake_build_typ": 39, "ddr4": 31, "ddr5": 31, "de6201297144": [37, 42], "dealloc": 32, "dearmor": 37, "deb": [37, 39], "debug": [11, 20, 22, 33], "debugalloc": 32, "decai": 25, "decayed_learning_rate_at_crossover_point": 51, "decid": 17, "decis": [0, 17], "declar": 11, "decoupl": [25, 30], "dedic": 7, "deem": 0, "deep": [15, 25, 27, 32, 36, 44, 63], "deeper": 23, "deeplearningexampl": [31, 51, 55, 60], "def": [28, 30, 35], "default": [4, 7, 13, 14, 15, 18, 19, 20, 21, 23, 27, 28, 30, 31, 32, 33, 35, 39, 40, 51, 52, 53, 60, 61, 62], "default_data_typ": [18, 33], "default_dataset": 49, "default_static_qconfig": 49, "defin": [4, 16, 28, 40], "definit": [7, 18, 23, 33], "deleg": 15, "deliv": [4, 19, 21, 27], "delta_tim": 35, "demand": [13, 63], "demo": 22, "demonstr": [0, 31, 44], "denali": 31, "deni": 18, "dens": [19, 20, 28, 35], "dense1": 28, "dense2": 28, "dense_1": [19, 28], "dense_2": [19, 28], "dense_logit": [19, 28], "denylist": 18, "denylist_add": 18, "denylist_remov": 18, "dep": [11, 34], "depend": [14, 16, 19, 29, 32, 36, 37, 39, 40, 42], "deploi": [21, 34], "deploy": [38, 41, 42], "deprec": 39, "depthwiseconv2dn": 49, "dequant": [49, 52], "derogatori": 0, "desc": [11, 13], "descibl": 11, "describ": [25, 28, 29, 32], "descript": [9, 13, 18, 29, 32, 33, 44, 56], "descriptor": 11, "design": [4, 7, 9, 21, 30, 34, 45], "desir": [18, 29], "destruct": 32, "detail": [2, 3, 11, 15, 16, 17, 18, 19, 21, 23, 25, 28, 32, 33, 36, 37, 39, 40, 42, 45, 47, 51, 63], "detect": [32, 49], "determin": [0, 11, 28, 32], "dev": [2, 3, 14, 22, 34, 39, 42, 47, 57], "develop": [4, 14, 16, 21, 30, 32, 37, 39, 40, 41, 42, 63], "deviat": 25, "devic": [2, 3, 4, 9, 10, 11, 13, 14, 16, 17, 19, 20, 21, 22, 23, 24, 28, 33, 34, 39, 40, 42, 47, 62, 63], "device_cpu": 11, "device_gpu": [11, 17, 62], "device_lib": 2, "device_num": [17, 62], "device_typ": [2, 14, 17, 39, 40, 58, 62], "diagram": 63, "dialect": [16, 17], "dict": 35, "did": [28, 32], "diff_undef": 11, "diffent": 27, "differ": [0, 2, 4, 13, 16, 20, 21, 23, 25, 29, 30, 32, 33, 35, 36, 43], "differenct": [39, 40], "differenti": 39, "difficult": 30, "diffus": [44, 63], "digit": [19, 28], "dim": 13, "dimens": 17, "dir": [2, 3, 7, 51, 55, 56, 57, 60], "directli": [11, 14, 17, 27, 28, 29, 32, 36, 42], "directori": [2, 3, 4, 5, 7, 14, 17, 29, 34, 37, 39, 40, 42, 47, 48, 49, 51, 54, 55, 57, 60], "diretcori": 40, "disabl": [0, 15, 19, 27, 29, 30, 32, 33], "disable_numactl": 29, "disable_taskset": 29, "disbal": 39, "discontinu": 14, "discuss": 7, "disk": [36, 49], "disparag": 0, "displai": [20, 49], "distanc": 54, "distinguish": [28, 30], "distribut": [2, 4, 8, 31, 32, 37, 38, 42, 43, 44, 51, 60, 61, 63], "distribution_strategi": 62, "divers": 0, "divid": [25, 28, 32], "divis": 28, "dl": 7, "dll": 51, "dllogger": [55, 60], "dllvm_enable_project": 39, "dnnl": [11, 13], "dnnl_arg_dst": 11, "dnnl_arg_scratchpad": 11, "dnnl_arg_src": 11, "do": [7, 14, 19, 27, 28, 29, 33, 36, 39, 52], "do_benchmark": 35, "do_lower_cas": 16, "do_predict": [16, 57], "do_train": [16, 57], "doc": [5, 9, 11, 39, 56], "doc_strid": 57, "docker": [9, 43, 44], "dockerfil": 2, "dockerhub": 63, "docs_build": 9, "docstr": 11, "document": [2, 3, 28, 31, 36, 38, 39, 40], "doe": [16, 24, 27, 28], "doesn": [5, 17, 18, 36, 56], "domin": 28, "don": [28, 49], "done": [7, 22, 28, 32, 35, 37], "doubl": 28, "download": [2, 8, 28, 32, 37, 42, 49, 51, 60, 61], "download_and_preprocess_coco": 60, "downstream": 18, "dpc": [21, 37, 38, 39, 40, 42], "dpcpp": [33, 37], "draft": 5, "dramat": 32, "dri": [2, 3, 34, 42, 47], "drive": 35, "driver": [2, 3, 14, 28, 31, 38, 45, 47, 52, 63], "drop": [18, 29, 35], "dropout": 35, "dst_mem": 11, "dst_tensor": 11, "dt_float": [20, 40], "dtype": [11, 19, 25, 26, 30, 35, 53, 62], "dtype_polici": 28, "due": [18, 27, 32, 35], "dummi": [31, 49, 61], "dummy_v2": 49, "dump": [20, 35], "duplic": 39, "dure": [0, 15, 16, 18, 19, 24, 28, 36, 38, 39, 40, 47], "dut3046": 28, "dynam": [13, 28, 32, 35, 36], "e": [0, 2, 3, 5, 11, 17, 28, 29, 34, 40, 60, 61], "each": [14, 25, 28, 29, 30, 31, 32, 62], "eager": [11, 25], "earli": 37, "easi": [16, 21, 30, 45], "easiest": 38, "easili": [16, 30, 31, 33], "ecc": 31, "echo": [37, 51], "econom": 0, "ecosystem": [16, 30, 63], "ed": 40, "edit": [0, 2], "edu": 55, "educ": 0, "effect": [18, 29, 32], "effici": [4, 16, 21, 30, 32, 34, 35, 51, 62, 63], "effort": 37, "egg": 60, "eigen": [4, 20], "either": [3, 19, 27, 49], "elaps": [32, 49], "elig": 11, "elimin": [16, 36], "els": [19, 28, 40, 61], "eltwis": 11, "eltwise_bas": 11, "eltwise_base_hdr": 11, "eltwise_forward": 11, "eltwise_gelu_erf": 11, "eltwise_gelu_tanh": 11, "eltwise_relu": 11, "eltwisebaseop": 11, "elu": 24, "email": 0, "emit": 16, "empathi": 0, "empir": 25, "en": 42, "enabl": [4, 13, 15, 16, 17, 18, 21, 22, 25, 27, 28, 29, 30, 31, 32, 33, 35, 36, 38, 39, 40], "enable_checkpoint_and_export": 62, "enable_itex_amp": 29, "enable_itex_layout_opt": 29, "enable_jemalloc": 29, "enable_op_parallel": 29, "enable_tcmalloc": 29, "enable_tensorboard": 62, "enable_tf_profil": [4, 21, 22, 28], "enable_xla": 62, "encod": 20, "encompass": 16, "encount": 14, "end": [28, 35, 39, 40, 44, 45, 52], "engin": [11, 14], "enhanc": [4, 30], "ensur": [7, 29], "enter": [2, 3, 22, 38, 39, 40], "enterpris": [31, 42], "entir": 28, "entri": 17, "enum": 33, "env": [14, 34, 38, 39, 40, 42, 46, 51, 52, 54], "env_check": [37, 38, 42, 63], "env_itex": [46, 47, 52, 54, 55, 56, 58, 60], "env_itex_cpu": [48, 56], "env_nam": 46, "environ": [0, 2, 4, 11, 13, 15, 16, 19, 21, 22, 23, 27, 28, 30, 32, 34, 35, 43, 44, 63], "environment": [30, 40], "epoch": [18, 19, 28, 35, 51, 58, 60], "epoch_loss_avg": 28, "epsilon": [25, 26], "equal": [24, 27, 32], "equival": [4, 28], "error": [4, 7, 11, 14, 20, 25, 28, 34, 47, 48, 51, 54, 55, 56, 57, 60], "errors_impl": [14, 47, 48, 51, 54, 55, 57, 60], "especi": [13, 38], "estim": [36, 63], "et": 25, "etc": [21, 30, 37, 39], "ethernet": 31, "ethnic": 0, "eu": 14, "eval_batch_s": 51, "evalu": [19, 28, 35, 54, 57], "even": [28, 29, 32, 43, 51, 63], "event": 0, "everi": [18, 20, 54], "everyon": 0, "evo": 31, "evolv": 30, "exact": 31, "exact_match": [51, 57], "exactli": 30, "exampl": [0, 2, 4, 5, 7, 9, 11, 14, 15, 20, 21, 24, 25, 26, 28, 31, 32, 33, 34, 37, 38, 45, 47, 50, 52, 56, 63], "example_test": 40, "except": [30, 33, 42, 51], "excess": 30, "exclud": 7, "exclus": 29, "excutor": 27, "exec": [11, 13], "exec_mod": 55, "execut": [2, 5, 11, 13, 15, 16, 17, 18, 19, 20, 22, 25, 28, 31, 32, 36, 39, 44, 52, 53], "executor": 15, "exist": [19, 24, 26, 28, 29, 45], "exit": 34, "exp": 18, "expect": [18, 38, 52, 63], "experi": [0, 4, 21, 23, 32], "experiment": [4, 13, 14, 22, 33, 39, 40, 42], "experimental_compil": 30, "experimental_gelu": 16, "experimental_ops_overrid": [26, 33], "explain": 18, "explan": 0, "explicit": [0, 11, 28, 32], "explicitli": [28, 29, 33, 52], "export": [4, 7, 11, 15, 16, 17, 18, 19, 21, 22, 28, 29, 30, 32, 34, 37, 38, 40, 42, 46, 47, 51, 52, 54, 57, 61, 62, 63], "expos": [21, 22, 63], "expr": 51, "express": 0, "extend": [4, 14, 21, 23, 25, 30, 32, 33], "extens": [5, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 31, 32, 36, 38, 43, 44, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "extent": 31, "extern": [0, 14, 40], "extra": [18, 28, 36], "extract": 51, "f": [2, 35, 40, 63], "f0": 11, "f1": [51, 57], "f502f0715979ec73c571ca5676ba58431b916f5f58ee3333": 56, "facilit": [4, 30], "factor": [21, 29], "fail": [11, 28, 33, 36], "fair": 0, "fairli": 0, "fallback": 25, "fals": [7, 16, 17, 25, 27, 28, 29, 35, 51, 57, 62], "familiar": 11, "faq": 0, "far": 28, "fashion": [4, 21], "fast": 25, "faster": [18, 19, 25, 27, 28, 32, 35, 36, 47, 49], "fatal": 14, "fdc7a2bc": [37, 42], "featur": [4, 7, 8, 11, 13, 17, 25, 32, 36, 39, 44, 52, 62, 63], "feedback": [0, 7], "fetch": 40, "few": [28, 61], "fewer": 28, "fi": 61, "fi_provid": 38, "fid": 54, "field": [33, 39, 40], "fig": [16, 36], "figur": [16, 30, 32], "file": [2, 5, 7, 14, 17, 18, 22, 29, 34, 37, 42, 47, 48, 49, 51, 54, 55, 56, 57, 60, 61, 63], "filenam": 35, "fill": [39, 40], "filter": 7, "filter_height": 53, "filter_width": 53, "final": [17, 19, 28, 51], "final_carry_st": 25, "final_memory_st": 25, "find": [7, 11, 22, 31, 32, 34, 36], "fine": [28, 29, 31, 32, 35, 51], "finish": [28, 35, 39, 53, 56], "first": [17, 18, 19, 22, 24, 25, 27, 28, 29, 30, 32, 37, 38, 39, 41, 42, 51, 55, 60], "fit": [19, 32, 35], "fix": [7, 28, 37], "flag": [17, 30, 40, 60], "flex": [39, 40, 42, 45, 47, 50, 52, 54, 57, 63], "flexibl": [4, 30, 33, 35], "flexibli": 63, "float": [11, 18, 20, 28, 33, 40, 47], "float16": [4, 16, 18, 19, 21, 28, 33, 47], "float16graph_opt": [18, 19], "float32": [11, 19, 24, 25, 26, 28, 30, 35, 51, 53, 55, 60], "flow": [16, 28], "flower": 52, "focus": [0, 30], "fold": 15, "folder": [2, 3, 19, 34, 39, 40, 61], "follow": [0, 2, 3, 7, 15, 16, 17, 18, 22, 24, 27, 28, 29, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 43, 45, 47, 48, 51, 53, 54, 55, 56, 57, 60, 61, 62, 63], "follw": 62, "footprint": 36, "forg": [14, 56], "fork": [32, 35], "format": [7, 9, 18, 24, 28, 33, 35, 36, 61], "forth": 63, "forward": [11, 28, 54], "forward_train": 11, "found": [7, 14, 28, 29, 32, 34, 36, 39, 51], "four": 18, "fp": 47, "fp16": [16, 18, 19, 31, 44, 47, 51], "fp32": [16, 18, 19, 20, 24, 31, 44, 45, 49, 51, 52, 60], "fpn": 49, "fraction": 16, "framework": [14, 16, 30, 35, 36, 37, 40, 47, 48, 50, 51, 54, 55, 57, 60], "free": [0, 21, 29], "frequenc": [14, 31], "frequent": [4, 36], "friendli": 32, "from": [0, 3, 5, 7, 11, 16, 17, 18, 19, 21, 22, 27, 28, 29, 30, 32, 33, 35, 36, 37, 39, 43, 44, 47, 49, 50, 51, 52, 55, 56, 63], "from_logit": 35, "from_model": 49, "from_tensor_slic": 28, "frontend": [4, 16, 21, 23], "frozen": 19, "fr\u00e9chet": 54, "full": [7, 39, 40, 42], "fulli": [4, 19, 21, 30, 35], "function": [5, 17, 20, 21, 23, 25, 26, 28, 30, 32, 33], "fundament": 16, "further": [4, 16, 21], "fuse": [4, 16, 18, 19, 21, 24, 26, 51], "fusedaccmatmul": 24, "fusedbatchnorm": 24, "fusedbatchnormgrad": 24, "fusedmatmul": 24, "fusion": [4, 9, 17, 18, 19, 21, 26, 33], "fwd_desc": 11, "fwd_pd": 11, "fwd_primit": 11, "fwd_primitive_arg": 11, "g": [5, 17, 28, 40, 56, 61], "g10": [39, 40], "g11": [39, 40], "gamma_constraint": [25, 26], "gamma_initi": [25, 26], "gamma_regular": [25, 26], "gate": 25, "gaussian": 25, "gb": 31, "gbs1": 51, "gbs2": 51, "gcc": [33, 39], "gd": 35, "gddr6": 31, "gelu": [11, 33], "gelu_erf": 24, "gelu_tanh": 24, "geluop": 11, "gen": 31, "gen9": 11, "gender": 0, "gener": [4, 5, 16, 20, 21, 23, 28, 29, 30, 31, 32, 34, 38, 39, 41, 47, 49, 52], "get": [2, 4, 7, 11, 13, 21, 28, 31, 32, 33, 34, 35, 37, 39, 40, 47, 48, 51, 54, 55, 57, 60, 63], "get_concrete_funct": 35, "get_config": 35, "get_scaled_loss": 28, "get_unscaled_gradi": 28, "get_weight": 28, "getattr": 11, "getsitepackag": [37, 38, 42, 63], "gh": 5, "ghz": 31, "gigabit": 31, "gin": 58, "git": [5, 11, 16, 33, 34, 39, 40, 47, 51, 54, 55, 57, 58, 60, 61, 62], "git_vers": [33, 38], "github": [5, 7, 8, 16, 21, 32, 34, 39, 40, 45, 47, 51, 54, 55, 57, 58, 60, 61, 62, 63], "give": [0, 35], "given": [17, 25, 29, 55], "glibcxx": 14, "glibcxx_3": 14, "global": [17, 28, 33, 62], "glorot_uniform": [25, 26], "glue_dataset": 16, "glue_dir": 16, "go": [7, 40, 41, 42], "go1": 7, "golang": 7, "gold": 31, "gomp": 32, "gomp_cpu_affin": 32, "good": [4, 19, 21, 23, 32, 34, 36], "googl": [7, 14, 16, 21, 22, 34, 57], "google_pretrained_weight": 51, "googleapi": [28, 35, 47, 49, 56], "govern": 63, "governor": 31, "gperftool": 32, "gpg": [37, 39], "gpu": [3, 4, 9, 11, 14, 15, 16, 18, 19, 20, 23, 24, 25, 27, 28, 33, 34, 38, 43, 44, 49, 63], "gpu_kernel": 11, "gpu_profil": 28, "gpudevic": 11, "gracefulli": 0, "grad": 28, "gradient": 28, "gradienttap": 28, "granular": [29, 32, 35], "graph": [4, 9, 10, 13, 15, 16, 18, 20, 23, 30, 35, 36, 44, 53, 62, 63], "graph_def": 35, "graph_opt": [17, 18, 19, 33, 47, 52, 62], "graph_pb2": 35, "graphdef": [17, 18, 35], "graphic": [37, 39, 40], "graphopt": [17, 18, 19, 47, 62], "grappler": [15, 17, 19, 58], "greater": [24, 32], "greaterequ": 24, "greatli": 28, "green": 15, "grep": 52, "group": [25, 32], "gt": [18, 33, 62], "guarante": 37, "guid": [4, 9, 11, 18, 21, 28, 31, 34, 37, 39, 40, 42, 44, 45, 52, 63], "guidelin": [1, 4, 16, 50, 63], "guidlin": 31, "gxx_linux": [14, 56], "gz": [7, 32, 49], "h": [7, 11, 14, 17, 34, 40], "ha": [2, 3, 4, 14, 18, 19, 20, 28, 30, 32, 36, 37, 40, 51, 62], "had": [28, 32], "half": [11, 28], "halv": 28, "hand": 16, "handl": [1, 13], "handwrit": [44, 45], "happen": [28, 36, 56], "harass": 0, "hard": [2, 54], "hardwar": [4, 16, 17, 19, 21, 23, 25, 29, 33, 35, 44], "harm": 0, "hasattr": [11, 33], "hasn": 54, "hat": 42, "have": [0, 18, 28, 32, 37, 38, 39, 42, 45, 49, 52], "hbm2e": 31, "hdr": [11, 34], "he": 25, "he_norm": 35, "header": 11, "headless": 60, "healthi": 0, "heap": 32, "help": [14, 19, 20, 21, 29, 32, 39, 40, 45, 52], "here": [8, 11, 14, 17, 18, 24, 27, 30, 35, 36, 39, 40, 49, 51, 54, 55, 60, 62], "heterogen": [17, 63], "heurist": 17, "high": [14, 16, 17, 28, 32, 63], "higher": [14, 15, 20, 28, 32], "highli": 28, "histori": [19, 28], "hlo": 16, "hochreit": 25, "hold": 32, "home": [7, 29, 37, 41, 42, 56], "homogen": 17, "hook": 17, "horovod": [2, 31, 37, 38, 42, 44, 51, 60], "horovodversionmismatcherror": 51, "host": [2, 3, 28, 39, 42, 47], "hour": 31, "how": [1, 5, 14, 17, 18, 27, 32, 34, 39, 40, 42, 44, 49, 58, 61, 63], "howev": [18, 21, 24, 28, 29, 30, 32, 54], "hpp": 11, "hs_to_tfg": 17, "hsp": 17, "html": [0, 5, 39, 42], "http": [0, 2, 5, 7, 8, 16, 21, 22, 28, 32, 34, 35, 37, 38, 39, 40, 41, 42, 45, 47, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "http_proxi": [2, 3], "https_proxi": [2, 3], "hub": 34, "hurt": 33, "hutter": 25, "hvd": 51, "hvd_configur": 61, "hvd_support": 61, "hyper": [29, 31, 32], "hyperparamet": 51, "hyphen": 32, "i": [0, 4, 5, 7, 9, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 44, 45, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "i0203": 61, "i0324": 62, "i0817": 61, "i1015": 51, "i1021": 51, "i1022": 51, "icd": [37, 42], "id": [2, 30, 34], "idea": 32, "ident": [0, 28], "identif": 28, "identifi": 39, "if_not_mobil": 34, "igc": 37, "ignor": [18, 28, 34], "ii": [18, 19, 33], "iii": [18, 19], "illustr": 32, "ilov": 25, "imag": [27, 28, 35, 41, 42, 44, 49, 54], "image_classif": [61, 62], "image_nam": [2, 3], "imagenet": 22, "imageri": 0, "img_arrays_for_acc": 54, "impact": [0, 5, 14, 18, 24, 32, 56], "implement": [4, 7, 10, 16, 17, 19, 21, 23, 25, 26, 30, 32, 35, 49, 51, 63], "import": [2, 7, 11, 14, 17, 18, 19, 22, 23, 25, 26, 27, 28, 30, 32, 35, 37, 38, 39, 40, 41, 42, 47, 49, 52, 53, 56, 63], "import_graph_def": 35, "imports_graph_def": 35, "improv": [15, 16, 19, 28, 32, 36, 39, 40, 49, 62], "inappropri": 0, "incarn": 2, "incept": [15, 18, 35, 44, 49, 54], "inceptionv4": 35, "inceptionv4_fp32_pretrained_model": [35, 47], "incid": 0, "includ": [0, 7, 13, 14, 16, 17, 18, 20, 23, 40, 42, 51, 52, 53, 63], "include_subdir": 7, "inclus": 0, "incorrect": 28, "increas": [18, 28, 52], "independ": [16, 25, 29, 35], "index": [18, 32], "indic": [24, 28, 47, 62], "individu": [0, 16, 20], "inf": 28, "infer": [11, 15, 16, 17, 18, 19, 24, 28, 34, 36, 44, 45, 51, 52, 56], "infer_config": 52, "infer_fp32_vs_amp": 47, "infer_inception_v4_amp": 47, "infer_resnet50": [29, 48], "inferlist": 18, "inferlist_add": 18, "inferlist_remov": [18, 19], "infin": 28, "influenc": [21, 29, 32], "info": [17, 18, 29, 36, 40, 45, 47, 49], "inform": [0, 1, 7, 8, 16, 20, 29, 32, 33, 39, 40, 42, 45, 52, 61, 63], "infrastructur": [4, 9, 20, 63], "init": 11, "init_checkpoint": 57, "initi": [17, 20, 28, 31, 35, 39, 40], "initial_weight": 28, "innov": [4, 63], "inplac": 7, "input": [4, 11, 13, 17, 19, 20, 21, 22, 24, 25, 28, 33, 35, 62], "input_height": 53, "input_shap": [35, 49], "input_width": 53, "input_x": 35, "insert": [18, 19, 24, 35, 52], "insid": [2, 63], "inspir": 0, "instal": [2, 3, 4, 7, 9, 14, 18, 19, 21, 22, 23, 26, 27, 28, 29, 31, 32, 33, 45, 46, 47, 48, 51, 52, 54, 55, 56, 57, 60], "install_head": 40, "instanc": [0, 31], "instance_idx": 29, "instancenorm": [19, 26], "instead": [36, 37, 39, 51, 54, 55, 60], "instruct": [2, 3, 4, 7, 16, 18, 19, 21, 31, 32, 41, 42, 54, 61, 63], "insult": 0, "int": [11, 35, 40, 51], "int8": [4, 28, 31, 45, 49, 52], "integ": 29, "integr": [4, 15, 16, 30, 32, 39], "intel": [0, 1, 5, 8, 9, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 36, 38, 43, 44], "intel_extension_for_tensorflow": [11, 17, 18, 19, 25, 26, 28, 29, 34, 37, 38, 39, 41, 42, 47, 49, 63], "intel_extension_for_tensorflow_lib": [11, 39], "intel_xpu": 2, "intelai": 16, "intelpython3_ful": 38, "intend": [7, 16, 63], "intent": 7, "inter": [4, 20, 35], "inter_op_parallelism_thread": 35, "interact": [0, 39], "interfac": [17, 30, 43, 63], "intermedi": [16, 28], "intern": 16, "internet": 47, "interop": 29, "interpret": 29, "intraop": 29, "introduc": [16, 29, 32, 36], "introduct": 19, "invalid": [13, 27, 32], "invent": 15, "investig": [0, 29], "invis": 0, "invok": [16, 17], "involv": 0, "io": [5, 34], "ip": 56, "ipc": [2, 3, 42, 47], "ipp": 55, "ipykernel": 54, "ipynb": [52, 54, 56], "ipython": 56, "ir": [16, 17], "irc_na": [37, 42], "is_bf16_math_mod": 24, "is_gpu_avail": 28, "isol": [37, 41, 42], "issu": [0, 1, 4, 7, 14, 18, 28, 37, 39, 40, 42, 56, 63], "item": [22, 35], "iter": [20, 31, 35, 36, 62], "itex": [0, 2, 3, 4, 8, 9, 11, 13, 14, 17, 18, 19, 20, 21, 23, 26, 27, 28, 29, 30, 31, 34, 37, 38, 39, 40, 41, 42, 46, 47, 52, 54, 62, 63], "itex_auto_mixed_precis": [16, 18, 19, 29, 33, 47], "itex_auto_mixed_precision_allowlist_add": [18, 19], "itex_auto_mixed_precision_allowlist_remov": 18, "itex_auto_mixed_precision_clearlist_add": 18, "itex_auto_mixed_precision_clearlist_remov": 18, "itex_auto_mixed_precision_data_typ": [16, 18, 19, 47], "itex_auto_mixed_precision_denylist_add": 18, "itex_auto_mixed_precision_denylist_remov": 18, "itex_auto_mixed_precision_inferlist_add": 18, "itex_auto_mixed_precision_inferlist_remov": [18, 19], "itex_auto_mixed_precision_log_path": [18, 19, 20, 33], "itex_auto_mixed_precision_unsafe_force_al": 18, "itex_bf16": 61, "itex_bf16_lar": 61, "itex_build": [39, 40], "itex_cfg": [17, 62], "itex_check_eq": 11, "itex_cpp_min_log_level": 20, "itex_disable_xla": 27, "itex_dummy_bf16": 61, "itex_dummy_bf16_lar": 61, "itex_dummy_fp32": 61, "itex_dummy_fp32_lar": 61, "itex_enable_multiple_stream": 62, "itex_enable_nextpluggable_devic": 27, "itex_fp32": 61, "itex_fp32_lar": 61, "itex_fp32_math_mod": [20, 51], "itex_gpu_wrapp": 42, "itex_layout_opt": [29, 32, 33], "itex_layout_optitex_remapperitex_auto_mixed_precisionitex_shard": 33, "itex_omp_threadpool": [3, 4, 20, 29, 35, 40], "itex_onednn_graph": [33, 52], "itex_ops_overrid": 27, "itex_optimizer_after_shard": 17, "itex_optimizer_before_shard": 17, "itex_quant": 49, "itex_remapp": 33, "itex_repo": 47, "itex_shard": 33, "itex_sync_exec": 33, "itex_tf_constant_fold": [15, 52], "itex_tile_as_devic": 20, "itex_verbos": [11, 17], "itex_vlog": 11, "itex_xpu_librari": 11, "itex_xx": 61, "itexauto_mixed_precision_opt": [18, 19], "itexdatatyp": 33, "itexgelu": 26, "itexgelugrad": 26, "itexlayernorm": 26, "itexlayernormgrad": 26, "itexlstm": 26, "itexresourceapplyadamwithweightdecai": 26, "itexrnn": 26, "its": [4, 11, 25, 28, 29, 30, 32, 37, 42, 53], "iv": [18, 19], "jammi": [37, 39], "jax": [16, 27, 30, 63], "jemalloc": 32, "jit": [4, 16, 27, 30], "jit_compil": 27, "job": [11, 20, 40], "join": [22, 32, 35], "json": [16, 35, 57], "just": [0, 4], "k8": [3, 40], "kaim": 25, "kdstindex": 11, "keep": [28, 32], "keepdim": 35, "kei": [9, 17, 20, 36, 37, 39], "kept": [26, 28], "kera": [4, 19, 25, 26, 31, 35, 51, 52, 54, 58, 63], "keras_util": [61, 62], "kerascv": 31, "keraslay": 22, "kernel": [2, 3, 9, 10, 15, 20, 22, 23, 24, 25, 28, 30, 31, 35, 37, 39, 40, 41, 42, 51, 52, 54, 56, 63], "kernel_initi": [25, 26], "kernels_experiment": 34, "keyr": 37, "kind": [0, 4, 21, 53], "kitti": 49, "kmp": 32, "kmp_affin": [29, 32, 35], "kmp_blocktim": [29, 32, 35], "knob": 29, "know": [19, 28], "knowledg": [19, 32], "known": [16, 28, 56], "kwarg": [25, 26, 35], "l": [34, 35, 40], "l28": 34, "l2loss": 24, "l_basekit_p_2024": [37, 42], "label_shap": 49, "ladder": 0, "lake": [4, 21], "lamb": [25, 51], "lambda": 25, "languag": [0, 40], "language_model": 16, "languagemodel": 51, "laptop": 14, "lar": 61, "larg": [4, 16, 20, 25, 28, 32, 35, 36, 44], "larger": [31, 32, 35, 39, 40], "last": [28, 56], "latenc": [13, 35, 47, 54], "latency_mod": 29, "later": [32, 37, 41, 42], "latest": [8, 27, 31, 34, 38, 39, 40, 42, 63], "launch": [21, 42, 54], "launcher": [4, 29, 32], "layer": [2, 9, 16, 19, 25, 28, 35, 52], "layer_0": 20, "layernorm": [19, 24, 26], "layernormgrad": 26, "layout": [13, 29, 33, 36], "layout_opt": 33, "ld": 32, "ld_library_path": 40, "ld_preload": [29, 32], "lead": [0, 16, 18], "leader": 0, "leakyrelu": 24, "learn": [0, 14, 15, 16, 19, 21, 25, 27, 29, 32, 34, 36, 44, 45, 63], "learning_r": [25, 26, 57], "learning_rate_per_gpu": 51, "learning_rate_phase1": 51, "learning_rate_phase2": 51, "least": [28, 37, 38], "leav": 32, "legaci": [27, 30, 51, 54, 55, 56, 57, 60, 61, 62], "legal": 7, "len": 35, "length": [16, 31, 51], "less": [4, 18, 19, 21, 24, 28, 35, 47], "lessequ": 24, "let": [18, 28, 34, 35], "level": [0, 14, 16, 17, 23, 24, 28, 37], "level_zero": 14, "level_zero_util": 14, "leverag": [4, 16], "lib": [2, 14, 29, 39, 40, 56], "lib64": 29, "lib_path": 40, "libgomp": 32, "libiari": 42, "libigc1": 37, "libigdfcl1": 37, "libigdgmm12": 37, "libiomp": 32, "libiomp5": [32, 40], "libitex": 40, "libitex_common": 39, "libitex_cpu": 39, "libitex_cpu_cc": [34, 40], "libitex_gpu": 39, "libitex_gpu_cc": [34, 40], "libitex_gpu_xetla": 40, "libmkl_sycl": [14, 47, 48, 51, 54, 55, 57, 60], "libomp": 39, "librari": [2, 3, 11, 14, 16, 29, 32, 37, 39, 42, 55], "library_path": 40, "libtensorflow": 40, "libtensorflow_cc": 40, "libtensorflow_framework": 40, "like": [0, 2, 7, 17, 25, 28, 32, 33, 46, 47, 57, 58], "limit": [16, 17, 32, 63], "line": [7, 28, 32, 34, 47, 56, 62], "linear": [4, 16, 19, 21, 25, 28, 30], "linearli": 25, "link": [2, 31, 40, 52], "linkstat": 11, "linux": [2, 3, 7, 29, 31, 32, 38, 39, 40, 41, 42, 52], "list": [2, 7, 11, 16, 19, 24, 27, 28, 29, 30, 32, 35, 37, 39, 40], "list_local_devic": 2, "list_physical_devic": [14, 19, 28], "littl": 18, "live": 16, "ll": [20, 24], "lld": 39, "lldb": 39, "llga": [7, 33], "llvm": [16, 39], "llvm_openmp": 40, "ln": 40, "load": [11, 28, 34, 35, 42], "load_data": [19, 28, 35], "load_ops_librari": 11, "load_pb": 35, "load_ref_result": 54, "local": [2, 3, 7, 14, 19, 29, 31, 32, 34, 35, 39, 40, 41, 42, 49, 58], "localalloc": 29, "localhost": [5, 11, 20, 41, 42], "locat": [7, 8, 39, 40, 51, 54], "lock": 13, "log": [7, 11, 18, 20, 22, 28, 33, 35, 40, 42, 47, 48, 51, 54, 55, 56, 57, 58, 60, 62], "log_everi": [55, 60], "log_file_prefix": 29, "log_path": 29, "log_step": 62, "log_warmup_step": 60, "logdir": 22, "logic": 32, "logit": 35, "logpath": 22, "long": [25, 30], "look": [2, 24, 34, 39, 40], "loop": [54, 62], "loshch": 25, "loss": [15, 18, 19, 31, 35, 44, 45, 52, 58], "loss_object": 28, "loss_scal": 28, "lossscaleoptim": 28, "low": [4, 16, 18, 21, 23, 28, 45], "lower": [4, 15, 18, 19, 21, 35, 47], "lowpropos": 49, "lr": [25, 51, 58], "lscpu": [32, 52], "lstm": 25, "lt": [31, 33, 37], "ltensorflow_cc": 40, "ltensorflow_framework": 40, "m": [5, 29, 32, 45, 46, 49, 54, 55, 58, 60], "m150": [39, 40], "m75": [39, 40], "machin": [2, 3, 14, 16, 21, 28, 29, 32, 34, 41, 42, 53, 58], "macro": 11, "made": [11, 30, 55], "mai": [0, 7, 13, 14, 16, 18, 19, 24, 28, 29, 32, 35, 36, 37, 38, 42, 54, 63], "mail": 0, "main": [5, 17, 21, 37, 39, 40, 55, 58, 60, 61], "mainli": [15, 17, 29], "maintain": [0, 7, 8, 14, 18, 21, 23, 25, 34, 36], "make": [0, 2, 3, 5, 7, 11, 16, 18, 19, 28, 30, 32, 35, 36, 39, 40, 47], "makefil": 40, "malloc": [29, 32], "malloc_conf": 29, "man": 32, "manag": 63, "mani": [16, 18, 21, 28, 29, 32, 58], "manner": 16, "manual": [5, 7, 18, 28, 29, 51, 61], "manylinux2014": [37, 41, 42], "manylinux2014_x86_64": 40, "manylinux_2_17_x86_64": 40, "map_structur": 35, "mark": 17, "mask": [25, 44], "maskrcnn": 60, "master": [32, 34, 36], "match": [16, 29, 36, 43], "matcher": 24, "math": [20, 24, 28, 37, 42], "matmul": [17, 20, 24, 26, 35, 36, 40, 49], "matrix": [36, 40], "max": [16, 33, 39, 40, 42, 47, 50, 51, 54, 55, 56, 57, 58, 60, 61, 62, 63], "max_seq_length": 57, "max_step": 55, "maxim": [4, 17, 21, 25, 33, 62], "maximum": [31, 51], "maxpool": 49, "maxpool3d": 24, "maxval": 35, "md": 21, "mean": [13, 14, 18, 25, 27, 28, 29, 32, 35, 36, 39, 40], "mechan": [4, 16, 21, 30], "media": 0, "medic": 44, "meet": [3, 25, 51, 63], "member": [0, 33], "membind": 32, "memori": [4, 9, 11, 13, 14, 15, 16, 18, 19, 21, 25, 28, 31, 36, 47, 51], "memory_limit": 2, "mention": [28, 32], "merg": 5, "messag": [28, 29], "meta": 13, "metadata_thp": 29, "metal": 44, "method": [28, 32, 45, 52], "metric": [19, 28, 35], "middl": 28, "might": [11, 39], "migrat": 7, "millisecond": 32, "mind": 16, "miniconda": 38, "miniconda3": 38, "minim": [15, 32], "minimum": [31, 39], "minor": [4, 21, 23], "minut": [25, 39, 40], "minval": 35, "miscellan": 9, "mismatch": 28, "miss": 15, "mistak": 0, "mit": 52, "mix": [4, 31, 33, 35, 44, 49], "mixed_bfloat16": 28, "mixed_float16": 28, "mixed_precis": 28, "mkdir": [2, 3, 39, 61, 62], "mkl": [7, 34, 37, 38, 39, 40, 42], "ml": 16, "mlir": 17, "mnist": [19, 28, 34, 35, 44, 58], "mnist_client": 34, "mnist_saved_model": 34, "mode": [16, 17, 20, 24, 31, 33, 39, 51, 54, 61], "model": [2, 3, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 27, 32, 33, 35, 36, 44, 45, 52, 56, 58, 62, 63], "model_base_path": 34, "model_dir": [3, 34, 55, 60, 61, 62], "model_nam": [3, 34], "model_path": 49, "model_serv": [3, 34], "model_training_util": 51, "model_typ": 61, "modelserv": 34, "moder": 0, "modern": 36, "modif": [4, 16, 30], "modifi": [5, 35, 40, 47, 51, 62], "modul": [14, 17, 29], "modular": 10, "modulenotfounderror": 14, "monitor": 14, "monolith": 16, "more": [1, 4, 7, 11, 16, 18, 19, 21, 25, 32, 34, 35, 36, 37, 39, 40, 42, 45, 51, 52, 53, 58, 61], "most": [4, 18, 19, 28, 29, 32, 47, 56], "mount": [2, 3], "move": [18, 32, 51, 55, 60], "mozilla": 0, "mpi": [37, 38, 42], "mpirun": [55, 58, 60, 61], "mrpc": 16, "mt": 31, "much": [28, 32, 35, 52], "mul": 24, "multi": [28, 32, 33, 38, 39, 51, 60, 62], "multipl": [18, 20, 32, 36, 62], "multipli": 28, "must": [5, 15, 27, 28, 35], "mutex": 13, "mutual": 29, "my": [14, 18, 19], "mybuilddir": 39, "myfil": 7, "n": [18, 24, 25, 32, 33, 38, 39, 40, 51, 53], "n02123159": 48, "na": [27, 31], "name": [2, 3, 5, 7, 11, 14, 18, 19, 20, 25, 26, 28, 30, 32, 34, 35, 44, 49, 54, 58], "name_scop": 11, "namespac": [4, 17, 21, 23, 25, 26, 33, 40], "nan": 28, "narrow": 28, "nation": 0, "nativ": [4, 15, 16, 21], "natur": 0, "ncdhw": 24, "nchw": 32, "ncore_per_inst": 29, "ndhwc": 24, "necessari": [16, 28, 37, 41, 42, 53], "necessarili": 16, "need": [4, 8, 13, 14, 16, 17, 20, 21, 23, 28, 29, 30, 34, 35, 36, 37, 38, 39, 40, 42, 47, 52, 53, 56, 60, 61, 62], "neg": [32, 35], "neglig": 28, "neither": 29, "nest": 35, "netron": 18, "network": [14, 15, 32], "neural": [4, 14, 15, 21, 32, 44, 45, 52], "new": [4, 5, 7, 8, 15, 16, 21, 23, 24, 28, 30, 32, 36, 45, 51], "newer": [15, 45, 46, 52], "newrootscop": 40, "next": [4, 16, 28, 39, 49], "next_pluggable_devic": 30, "next_pluggable_device_factori": 30, "nextplugg": 30, "nextpluggabledevic": 16, "nhwc": [20, 32], "nibabel": 55, "nic": 31, "nice": 32, "nifti": 55, "nightli": 55, "ninstanc": 29, "nn": [11, 25, 26, 33, 35, 53], "nn_op": 11, "no_proxi": [2, 3], "no_python": 29, "node": [13, 18, 20, 24, 32, 36, 38, 45, 51], "node0": 32, "node1": 32, "node_id": 29, "nolint": 7, "nolintnextlin": 7, "non": [27, 35], "none": [8, 25, 26, 28, 29, 33, 51], "nonetyp": 56, "nonlinear": 25, "nor": 29, "norm": 25, "normal": [17, 20, 25, 28, 32, 39, 47], "note": [2, 3, 5, 11, 16, 17, 18, 20, 25, 27, 28, 29, 31, 33, 34, 36, 39, 40, 47, 49, 51, 54, 58, 60, 61], "notequ": 24, "notfounderror": [14, 47, 48, 51, 54, 55, 57, 60], "noth": 11, "notic": [13, 28], "novel": 16, "now": [2, 18, 28, 32, 34], "np": [22, 25, 53, 55, 58, 60, 61], "npd": [4, 27, 30], "npz": 28, "nth": 32, "nullptr": 11, "num": [29, 32, 51], "num_accumulation_steps_phase1": 51, "num_accumulation_steps_phase2": 51, "num_channel": 53, "num_class": 35, "num_el": 11, "num_gpu": [51, 62], "num_test": 34, "num_train_epoch": 57, "num_unit": [19, 28], "numa": 31, "numactl": [29, 35], "number": [15, 20, 24, 28, 31, 32, 35, 36, 44, 45, 51, 54, 61, 62], "number_of_process": 61, "numer": 28, "numpi": [22, 25, 28, 53, 55], "nv_result": 54, "nvidia": [28, 51, 54, 55, 60], "nvme": 31, "o": [2, 22, 27, 31, 35, 37, 38, 39, 40, 42, 44, 52], "oam": 31, "object": [12, 14, 18, 28, 32, 33, 47, 48, 49, 51, 54, 55, 56, 57, 60], "oblig": 0, "obvious": 18, "occasionali": 27, "occupi": 18, "occur": 28, "ocl": 11, "ocloc": [39, 40], "off": [13, 29, 31, 33, 52, 62, 63], "offcial": 11, "offens": 0, "offer": [19, 30, 32, 49], "offici": [0, 16, 32, 44, 45, 46, 51, 54, 55, 57, 60, 61, 62], "offlin": [0, 36, 39, 40], "offononoffoff": 33, "often": [29, 37, 41, 42], "ok": 51, "omp": [4, 20, 32, 35], "omp_num_thread": [29, 35], "omp_proc_bind": 32, "omp_schedul": 32, "onboard": 32, "onc": [20, 28, 32, 36], "onconfig": [18, 19], "one": [11, 15, 20, 21, 28, 32, 39, 40, 47, 53, 55, 61], "oneapi": [2, 14, 21, 31, 34, 38, 45, 47, 48, 51, 52, 54, 55, 56, 57, 60, 61, 62, 63], "oneapi_install_path": 34, "oneccl": [2, 37, 38, 42, 51], "onednn": [9, 11, 12, 14, 15, 20, 24, 32, 33, 36, 44], "onednn_cpu_git_vers": 33, "onednn_engin": 11, "onednn_gpu_git_vers": 33, "onednn_graph": 33, "onednn_graphoverrid": 33, "onednn_stream": 11, "onednn_verbos": 11, "onednngraph": 15, "onemkl": [37, 38, 39, 40, 42], "ones": [22, 25, 26, 33, 51], "onli": [2, 4, 5, 13, 14, 16, 17, 18, 20, 21, 23, 24, 28, 29, 30, 33, 34, 36, 37, 41, 51, 54, 55, 56, 57, 60, 61, 62], "onlin": [0, 31, 63], "op": [4, 9, 10, 16, 17, 20, 21, 23, 24, 26, 27, 28, 30, 35, 40, 49, 51, 54], "op_build": 11, "op_kernel": 11, "op_requires_ok": 11, "opaqu": 30, "open": [0, 5, 7, 14, 16, 18, 21, 34, 35, 37, 47, 48, 51, 52, 54, 55, 56, 57, 60, 63], "opencl": [14, 37, 39, 40, 42], "opencv": [49, 60], "openmp": [29, 39], "openvino": 49, "openxla": 4, "openxla_support_on_gpu": 21, "oper": [4, 13, 15, 16, 18, 23, 24, 28, 32, 35, 36, 63], "opinion": 0, "opkernel": 11, "opkernelconstruct": 11, "opkernelcontext": 11, "ops_overrid": 27, "opt": [2, 3, 11, 14, 37, 39, 40, 42, 46, 58], "optim": [2, 4, 9, 14, 15, 16, 17, 18, 23, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 42, 44, 45, 47, 49, 50, 51, 52, 54, 55, 60, 61, 63], "option": [2, 3, 7, 11, 18, 21, 29, 33, 35, 61, 62, 63], "order": [18, 19, 28, 29, 30, 32, 38, 43], "org": [0, 2, 7, 21, 39, 40, 49, 56], "organ": 16, "orient": 0, "origin": [4, 16, 18, 21, 23, 24, 25, 31, 36, 40, 45, 47, 49, 56], "orign": 31, "orthogon": [25, 26], "other": [0, 17, 20, 25, 28, 29, 30, 31, 32, 33, 34, 35, 37, 39, 40, 42, 56, 58, 63], "otherwis": [0, 17, 28, 33, 52, 53], "our": 29, "out": [3, 15, 28, 36, 40, 48, 51, 53, 54, 62], "outcom": 54, "outermost": 25, "output": [2, 7, 11, 13, 16, 19, 20, 24, 25, 28, 30, 31, 33, 35, 37, 39, 40, 47, 49, 52, 57], "output_dim": 35, "output_dir": [16, 55, 57, 60], "over": [18, 28, 49], "overal": [0, 32], "overhead": [13, 16, 28, 32, 35, 51], "overload": 26, "overrid": [4, 11, 18, 27, 28], "oversize_threshold": 29, "overview": 4, "own": [35, 49], "p": [2, 3, 25, 34, 41, 42, 47, 61], "pacakg": 56, "packag": [3, 27, 30, 32, 37, 38, 39, 41, 45, 51, 52, 55, 56, 60, 63], "pad": [24, 25, 53], "page": [5, 21, 22, 23, 32, 63], "paintbucket": 18, "parallel": [13, 20, 32, 35, 39], "paramet": [17, 26, 35, 47, 51], "parent": 9, "parsefromstr": 35, "part": [15, 16, 17, 32, 39, 40, 51, 60], "parti": [9, 36, 63], "particip": 0, "particular": 28, "particularli": 14, "partit": [15, 32], "pass": [11, 15, 16, 17, 28, 31, 33, 36, 49, 54, 62], "patch": [7, 34, 51, 54, 55, 57, 60, 62], "path": [2, 3, 7, 16, 18, 19, 20, 22, 29, 32, 33, 34, 37, 38, 39, 40, 42, 47, 49, 51, 52, 55, 57, 60, 61, 62], "path_to_itex": 3, "path_to_libitex_cpu_cc": 34, "path_to_libitex_gpu_cc": 34, "path_to_python_unit_test": 7, "path_to_site_packag": [37, 38, 42, 63], "path_to_tensorflow_serv": 3, "pattern": [0, 4, 15, 16, 21, 24], "pb": [18, 19, 34, 35, 47, 49], "pb_file": 35, "pbtxt": 17, "pci": [2, 30], "pcie": 31, "pdf": 25, "peak": [18, 23], "penal": 32, "peopl": 0, "per": [17, 28, 29, 31, 32, 38, 58, 62], "perf": 27, "perform": [4, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 25, 28, 29, 32, 33, 35, 36, 39, 40, 44, 49, 51, 52, 54, 55, 60, 62, 63], "period": [0, 32], "permiss": [0, 5], "person": 0, "perspect": [29, 32], "phase": [15, 31, 36, 51], "phase1": [31, 51], "phase2": 51, "phase_2": 51, "photo": 52, "physic": [0, 30, 32, 62], "physical_devic": [14, 58], "physical_device_desc": 2, "physicaldevic": [14, 58], "pick": 7, "picker": 5, "piecewiseconstantdecai": 25, "pip": [7, 11, 14, 22, 27, 33, 34, 37, 38, 39, 40, 41, 42, 45, 46, 49, 51, 54, 55, 58, 60, 62, 63], "pip3": 41, "pip_packag": [11, 39], "pip_set_env": [51, 52, 54, 55, 57, 60, 61], "pipelin": [16, 44, 45, 52], "pjrt": [4, 16, 21, 63], "place": [4, 17, 21, 32, 40], "placement": [29, 32], "plai": 32, "plain": 36, "platform": [14, 16, 28, 32, 33, 37, 39, 40, 41, 51, 54, 55, 56, 57, 60, 61, 62], "platinum": [31, 32, 35], "pleas": [7, 11, 14, 16, 17, 21, 27, 28, 37, 39, 40, 42, 44, 45, 47, 51, 53, 55, 57, 58, 60, 61, 63], "plu": [16, 32], "plug": [34, 63], "pluggabl": [4, 10, 16, 30, 40], "pluggable_devic": 30, "pluggable_device_factori": 30, "pluggabledevic": [10, 27, 63], "plugin": [4, 10, 16, 18, 19, 21, 22, 34, 39, 58, 63], "po": 35, "point": [17, 18, 20, 28, 33, 37, 42, 47], "polici": [29, 32, 63], "polit": 0, "polymorph": 11, "pool": 4, "popular": [15, 16, 31], "port": [34, 54], "portabl": [16, 36], "posit": [0, 7], "possibl": [4, 19, 32, 35, 36, 39], "post": [0, 7, 18, 19, 24, 33], "post1": 40, "potenti": [28, 63], "power": [19, 63], "ppn": [55, 58, 60, 61], "pr": 5, "practic": [4, 28, 29], "pramet": 62, "pre": [18, 31, 33, 41, 42, 51, 56], "precis": [4, 16, 30, 31, 33, 44, 45, 49, 54, 57], "preconfigur": 39, "predict": [19, 26, 27, 28, 35, 57], "predict_batch_s": 16, "predict_fil": 57, "prefer": [29, 37, 41, 42], "prefix": 29, "preload": 32, "preop": 18, "prepack": 4, "prepend": [29, 55, 58, 60, 61], "preprocess": 60, "preprocess_data": 55, "present": [30, 54], "preserv": 20, "press": 38, "pretrain": [31, 44, 49], "pretrain_bert": 51, "pretrain_lamb": 51, "pretrain_path": 51, "pretrain_result_dir": 51, "prevent": 28, "previou": [8, 25, 32, 51], "previous": [28, 30], "primari": [17, 32], "primit": [11, 13, 20, 36], "primitive_attr": 11, "primitive_desc": 11, "principl": 18, "print": [2, 11, 19, 22, 25, 28, 29, 30, 33, 35, 37, 38, 39, 40, 41, 42, 47, 48, 51, 53, 54, 62, 63], "print_graph": 35, "printf": 51, "priorit": 18, "prioriti": [20, 33], "privaci": 0, "privat": 0, "privileg": [2, 3, 47], "problem": [14, 24, 28, 32, 56], "proc": [28, 32], "procedur": [11, 37, 41, 42], "process": [4, 7, 11, 16, 21, 28, 29, 32, 34, 51, 52], "process_per_nod": 61, "processor": [4, 21, 31, 32, 41, 47, 52, 53], "proclist": 32, "produc": 57, "product": [5, 7, 21, 34, 37], "profession": 0, "profil": [4, 9, 28, 30, 32], "profiler_demo": 22, "program": [9, 27, 32, 63], "project": [2, 5, 7, 16, 63], "prolong": [39, 40], "promot": 7, "prompt": [31, 39, 40], "promptli": 0, "prop_kind": 11, "propag": [9, 13, 16, 17], "properli": [21, 29], "properti": [17, 18, 28], "propos": [7, 25], "protect": 11, "protobuf": 52, "protocol": 49, "protocolmessag": 33, "provid": [0, 2, 4, 7, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 40, 42, 44, 45, 49, 51, 52, 55, 60, 61, 62, 63], "proxi": 36, "prune": 35, "pseudocod": 28, "pub": 37, "public": [0, 4, 5, 11, 21, 25, 33, 34], "publish": [0, 5], "pull": [7, 34, 41, 42, 47], "pure": 31, "push": [5, 16], "put": 34, "pvc": [39, 40, 51], "pwd": [47, 62], "py": [7, 11, 16, 22, 29, 34, 35, 42, 47, 48, 49, 51, 54, 55, 56, 57, 58, 60, 61, 62], "pybind11": 60, "pycocotool": 60, "pylint": 7, "pylintrc": 7, "pypi": [2, 43, 63], "python": [2, 4, 9, 14, 19, 22, 23, 25, 26, 27, 28, 29, 30, 32, 34, 35, 37, 38, 39, 41, 42, 45, 46, 49, 51, 52, 53, 55, 56, 57, 58, 60, 61, 63], "python3": [2, 5, 16, 38, 39, 54, 56], "pythonhost": 40, "pythonpath": 61, "pytorch": [27, 30], "q1": 14, "q_model": 49, "qdq": 52, "qo": 37, "qualiti": 28, "quantiz": [4, 44], "quantizev2": 49, "queri": 28, "question": [0, 4, 36, 63], "queue": [35, 62], "quick": [4, 11, 37, 44], "quickli": [20, 28], "r": [3, 7, 14, 28, 31, 32, 44, 62], "r2": [34, 40, 62], "race": 0, "rais": 33, "rand": 53, "random": [25, 35, 53], "randomnorm": 40, "rang": [25, 28, 32, 35], "rank": [31, 55, 58, 60, 61], "rapid": [41, 47], "rare": 28, "rate": [14, 15, 18, 25, 34], "rather": 25, "ratio": 36, "raw": 58, "rb": 35, "rcfile": 7, "rcnn": 49, "re": [2, 32, 35, 46], "reach": 18, "read": [20, 28, 35, 45, 55], "readm": 61, "real": [15, 28, 36, 51, 61], "reason": [0, 28, 30], "recent": 56, "recogn": [44, 45], "recommend": [16, 20, 28, 32, 33, 34, 35, 37, 38, 39, 41, 42, 46, 52], "record": [36, 61], "recurrent_activ": [25, 26], "recurrent_initi": [25, 26], "recurs": 7, "red": 42, "reduc": [15, 16, 18, 28, 32, 36, 39, 40, 45, 51, 54, 62], "reduce_mean": 35, "ref_result_dir": 54, "refer": [2, 3, 7, 11, 14, 15, 17, 18, 19, 20, 21, 23, 28, 31, 32, 33, 34, 37, 39, 40, 42, 44, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63], "refresh": 22, "regardless": 0, "region": 32, "regist": [4, 14, 30, 45, 52], "register_": 11, "register_geluop": 11, "register_kernel_build": 11, "registr": [10, 11, 55], "registrationcent": [37, 42], "regress": 27, "regular": [25, 36], "reinstal": 51, "reject": 0, "rel": [16, 29, 51], "relat": [5, 27, 29, 34, 36], "relationship": [14, 18], "releas": [4, 14, 17, 32, 33, 34, 39, 40, 45, 54, 56], "reli": 17, "relianc": 16, "religion": 0, "relu": [4, 11, 19, 21, 24, 25, 26, 28, 35, 53], "relu6": 24, "relu_op": 11, "relu_op_functor": 11, "relubaseop": 11, "relugrad": 24, "remain": [20, 30], "remapp": [19, 24, 33], "remot": 32, "remov": [0, 11, 16, 18, 24], "reorder": [13, 36], "repeat": 18, "replac": [14, 25, 26, 27, 34, 36, 40, 51], "replica": [11, 20], "repo": [5, 31, 37, 38], "report": [0, 7, 20, 63], "repositori": [9, 16, 31, 37, 51, 55, 60], "repres": [0, 4, 16, 17, 30, 31], "represent": 15, "representative_dataset": 49, "reproduc": 31, "request": [0, 7, 63], "requir": [2, 4, 7, 11, 13, 15, 16, 21, 22, 24, 25, 28, 29, 30, 36, 38, 45], "rerun": 28, "research": 57, "reserv": 32, "reset": 54, "reshap": [19, 25, 28, 35], "resnet": [61, 62], "resnet101": 49, "resnet34": 49, "resnet50": [17, 29, 31, 44, 49, 59], "resnet50_itex": 62, "resnet_ctl_imagenet_main": 62, "resnet_v1_50": 22, "resolv": 1, "resourc": [29, 32, 56], "respect": [0, 29, 35, 51], "rest": [20, 24], "rest_api_port": 34, "restart": 38, "result": [5, 15, 16, 17, 19, 22, 27, 28, 30, 32, 33, 38, 45, 48, 53, 54, 56, 62], "result_dir": 51, "retinanet50": 49, "retrain": 28, "retriev": [28, 49], "return": [11, 17, 28, 30, 33, 35, 40], "return_sequ": 25, "return_st": 25, "reus": [32, 45], "review": 0, "rewrit": [11, 17], "rewrite_opt": 52, "rewriter_config_pb2": 52, "rewriterconfig": 52, "rewritten": 16, "rf": [34, 46, 61], "rfc": [7, 21], "right": [0, 25], "rm": [34, 40, 46, 47, 61], "rmsprop": [19, 28, 35], "role": 32, "root": [7, 39, 40, 56], "rpath": 40, "rule": 19, "run": [7, 11, 14, 16, 18, 19, 22, 24, 26, 27, 28, 29, 31, 32, 33, 35, 39, 41, 42, 63], "run_20210712212258_inst": 29, "run_20210712212258_instance_0_cores_0": 29, "run_20221009103552_inst": 29, "run_20221009103552_instance_0_cores_0": 29, "run_20221009104740_inst": 29, "run_20221009104740_instance_0_cores_0": 29, "run_20221009105044_inst": 29, "run_20221009105044_instance_0_cores_12": 29, "run_20221009105320_inst": 29, "run_20221009105320_instance_0_cores_0": 29, "run_20221009105838_inst": 29, "run_20221009105838_instance_0_cores_0": 29, "run_20221009105838_instance_1_cores_12": 29, "run_20221009105838_instance_2_cores_24": 29, "run_20221009105838_instance_3_cores_36": 29, "run_20221009105838_instance_4_cores_48": 29, "run_20221009105838_instance_5_cores_60": 29, "run_20221009105838_instance_6_cores_72": 29, "run_20221009105838_instance_7_cores_84": 29, "run_20221009110327_inst": 29, "run_20221009110327_instance_0_cores_0": 29, "run_20221009110327_instance_10_cores_40": 29, "run_20221009110327_instance_11_cores_44": 29, "run_20221009110327_instance_12_cores_48": 29, "run_20221009110327_instance_13_cores_52": 29, "run_20221009110327_instance_14_cores_56": 29, "run_20221009110327_instance_15_cores_60": 29, "run_20221009110327_instance_16_cores_64": 29, "run_20221009110327_instance_17_cores_68": 29, "run_20221009110327_instance_18_cores_72": 29, "run_20221009110327_instance_19_cores_76": 29, "run_20221009110327_instance_1_cores_4": 29, "run_20221009110327_instance_20_cores_80": 29, "run_20221009110327_instance_21_cores_84": 29, "run_20221009110327_instance_22_cores_88": 29, "run_20221009110327_instance_23_cores_92": 29, "run_20221009110327_instance_2_cores_8": 29, "run_20221009110327_instance_3_cores_12": 29, "run_20221009110327_instance_4_cores_16": 29, "run_20221009110327_instance_5_cores_20": 29, "run_20221009110327_instance_6_cores_24": 29, "run_20221009110327_instance_7_cores_28": 29, "run_20221009110327_instance_8_cores_32": 29, "run_20221009110327_instance_9_cores_36": 29, "run_20221009110849_inst": 29, "run_20221009110849_instance_0_cores_0": 29, "run_20221009110849_instance_1_cores_11": 29, "run_20221009110849_instance_1_cores_24": 29, "run_20221009110849_instance_2_cores_22": 29, "run_20221009110849_instance_2_cores_48": 29, "run_20221009110849_instance_3_cores_33": 29, "run_20221009110849_instance_3_cores_72": 29, "run_20221009111034_instance_0_cores_0": 29, "run_20221009111239_instance_0_cores_24": 29, "run_20221009111753_inst": 29, "run_20221009111753_instance_0_cores_0": 29, "run_20221009111951_inst": 29, "run_20221009111951_instance_0_cores_0": 29, "run_20221009112720_instance_0_cores_0": 29, "run_20221009112905_instance_0_cores_0": 29, "run_20221009112956_instance_0_cores_0": 29, "run_classifi": 16, "run_inf": 35, "run_jupyt": 52, "run_pretraining_lamb": 51, "run_squad": [51, 57], "runner": 61, "runtim": [16, 18, 23, 25, 27, 28, 32, 36, 37, 39, 40, 51, 63], "safe": [13, 18, 33, 63], "sai": [28, 51], "same": [5, 7, 14, 20, 21, 23, 24, 25, 28, 29, 30, 31, 32, 33, 34, 35, 36, 39, 40, 45, 53], "sampl": [2, 22, 31, 35, 45, 52, 54], "samsung": 31, "saniti": [7, 63], "sapphir": [41, 47], "satisfi": [13, 23], "save": [5, 11, 17, 29, 33, 49, 57], "save_checkpoint_step": 51, "save_json_data": 35, "saved_model": 34, "savedmodel": 49, "scalabl": [4, 21, 31, 34, 41, 47], "scale": [4, 25, 26, 31, 35, 62], "scaled_gradi": 28, "scaled_loss": 28, "scenario": [4, 13, 20, 21, 23, 32, 33], "schedul": [13, 16, 25, 29, 32, 35], "schmidhub": 25, "scope": [17, 40], "scratch": [28, 51], "scratchpad": [11, 13], "scratchpad_mem": 11, "scratchpad_mod": 11, "screen": 47, "script": [5, 21, 22, 27, 32, 39, 40, 42, 47, 49, 51, 53, 55, 56, 60, 61], "sdp": 29, "seamless": [4, 30], "search": [7, 29], "sec": [31, 35, 51, 62], "second": [32, 35, 52, 61, 62], "section": [14, 28, 32, 37, 39, 40, 49], "secur": 0, "see": [0, 1, 2, 4, 7, 14, 16, 22, 25, 28, 29, 32, 34, 36, 37, 39, 52, 61, 63], "seed": 60, "seen": 32, "segment": [31, 44, 60], "select": [14, 28, 29, 30, 33, 54, 63], "self": 35, "semant": [17, 20, 25], "send": 16, "separ": [11, 14, 23, 24, 28, 31, 32, 38, 39, 63], "seq": 16, "sequenc": [31, 51, 54], "sequenti": 35, "seri": [0, 16, 32, 33, 39, 40, 42, 45, 47, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62, 63], "serial": 35, "seriesintel": 47, "seriesne": 47, "seriessupport": 47, "seriou": 0, "serv": [4, 30], "serval": 27, "server": [5, 31, 39, 40, 42], "servic": 55, "serving_plugin": 34, "session": [40, 52], "set": [0, 2, 4, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 27, 31, 32, 33, 35, 37, 38, 40, 42, 47, 51, 52, 57, 63], "set_config": [17, 18, 19, 47, 62], "set_env_cpu": [47, 48, 56], "set_env_gpu": [47, 48, 56], "set_global_polici": 28, "set_log_device_plac": 22, "set_scratchpad_mod": 11, "set_sess": 52, "set_weight": 28, "setup": [38, 41, 43, 45], "setvar": [14, 37, 42, 46, 58], "sever": [4, 16, 21, 29, 31, 32, 39, 40, 44, 61], "sex": 0, "sexual": 0, "sh": [2, 3, 5, 14, 34, 37, 38, 39, 40, 42, 46, 47, 48, 51, 52, 54, 55, 56, 57, 58, 60, 61, 63], "shape": [11, 13, 16, 17, 19, 25, 28, 30, 35, 36, 53], "shard": [4, 17, 21, 33], "sharding_config": [17, 62], "shardingconfig": [17, 62], "share": [7, 14, 32, 37, 47, 48, 51, 54, 55, 57, 60], "short": [16, 25, 28], "shoul": 40, "should": [2, 3, 5, 7, 22, 27, 28, 32, 34, 35, 37, 38, 40, 41, 42, 45, 51, 57, 62], "show": [5, 14, 16, 18, 27, 28, 31, 35, 39, 40, 42, 44, 45, 47, 49, 50, 51, 52, 54, 55, 56, 57, 60, 61, 62], "showcas": [16, 31], "shown": [2, 3, 15, 22, 24, 29, 51, 54, 55, 60], "shuffl": 28, "sigmoid": [24, 25, 26], "sign": [25, 37], "signific": [4, 7, 18], "significantli": [4, 28], "signoff": 51, "similar": [19, 32], "simpl": [4, 21, 23, 28, 40], "simpli": [28, 30, 62], "simplifi": 45, "simultan": [31, 42], "sinc": [4, 14, 28, 32, 36, 42], "singl": [0, 4, 7, 15, 20, 21, 24, 31, 51, 60, 61], "single_l2_loss_op": 62, "site": [5, 8, 37, 38, 39, 42, 56, 63], "situat": [20, 33], "size": [0, 20, 25, 28, 29, 31, 51, 58, 62], "skip": [7, 28, 29, 38], "skip_cross_node_cor": 29, "skip_ev": 62, "sle": 42, "sleep": 32, "slowdown": 16, "slower": [18, 19, 28, 35], "slowli": 28, "small": [13, 25, 28, 29, 32, 35], "sn850x": 31, "snapshot": 39, "snippet": 61, "so": [14, 16, 19, 28, 29, 32, 33, 34, 39, 40, 47, 48, 51, 54, 55, 56, 57, 58, 60], "social": 0, "socio": 0, "socket": [31, 32, 38, 62], "softmax": [18, 19, 28], "softwar": [2, 16, 38, 43, 45, 52, 53, 58], "sole": 32, "solut": [4, 14, 15, 21, 27, 30], "solv": [28, 56], "some": [2, 11, 18, 19, 26, 28, 29, 32, 39, 40, 49, 51, 58], "sometim": 7, "sort": [0, 16], "sourc": [2, 3, 4, 7, 11, 16, 17, 21, 37, 38, 42, 43, 46, 47, 48, 52, 55, 56, 58, 60, 63], "sp4": [31, 42], "sp5": 42, "space": [0, 32, 63], "sparse_categorical_crossentropi": [19, 28], "sparsecategoricalaccuraci": [28, 35], "sparsecategoricalcrossentropi": [28, 35], "special": [16, 19, 23, 28, 39, 40], "specif": [4, 16, 28, 30, 32, 33, 34, 37, 42, 61, 63], "specifi": [0, 3, 11, 21, 24, 28, 29, 32, 34, 39, 40, 49], "sped": 28, "speed": [15, 16, 18, 32, 44, 45], "speedup": [16, 31, 52, 62], "spend": 28, "split": [17, 18, 35], "squad": [31, 51, 57], "squad_dir": 57, "squad_vers": 51, "src": [7, 11, 14, 17, 34, 39], "src_md": 11, "src_mem": 11, "src_tensor": 11, "ssd": [31, 49], "ssdsc2kg960g8": 31, "st": [3, 40], "stabil": [19, 28], "stabl": [25, 28, 44, 63], "stable_diffusion_accuraci": 54, "stable_diffusion_infer": 54, "stable_diffussion_infer": 54, "stablehlo": 16, "stack": [31, 42, 43], "stage": [16, 52], "stage_num": [17, 62], "stall": 32, "standard": [7, 25], "standard_op": 40, "start": [2, 3, 14, 21, 22, 28, 29, 34, 35, 63], "startup": [39, 40], "stat": 22, "static": 32, "statist": 49, "statu": [0, 11, 19, 40], "status_msg": 40, "statusuniqueptr": 11, "std": [11, 40], "stdout": [7, 29], "steal": 35, "step": [3, 16, 17, 18, 25, 28, 31, 32, 34, 36, 44, 45, 51, 55, 58, 60, 62], "steps_per_epoch": [35, 60], "steps_per_loop": 62, "still": 28, "stock": [14, 16, 23, 24, 28, 30, 37, 38, 41, 42, 45, 49, 51, 54, 55, 56, 57, 60, 61, 62, 63], "stop": [22, 32], "storag": [16, 28, 31, 35, 47, 49, 56], "store": 36, "strategi": 32, "stream": [13, 27, 54, 62], "stream_executor": 28, "streamexecutor": [10, 30], "streamlin": [4, 21, 34], "strictli": 25, "stride": 53, "string": [18, 28, 29, 39, 40], "stringop": 34, "strong": 18, "structur": [4, 19, 29, 32], "sub": [9, 14, 18, 19, 32, 33], "subgraph": [15, 16], "submit": [5, 7, 63], "subsequ": [18, 19, 28, 32, 54], "subystem": 37, "succe": 36, "success": [48, 53, 54, 62], "successfulli": [14, 34, 38, 39, 40, 42, 62], "sudo": [7, 34, 37, 39, 40, 42], "suffici": [28, 35], "suggest": [56, 62], "sum": 35, "summari": [51, 63], "super": 35, "suppli": 35, "support": [4, 7, 13, 14, 15, 16, 17, 18, 19, 22, 24, 27, 28, 29, 30, 32, 33, 37, 39, 40, 41, 42, 45, 47, 52, 61, 62], "suppos": [32, 51], "sure": [3, 11, 28, 35, 37, 39, 40], "suse": [31, 42], "sustain": 0, "sw": 37, "swish": [19, 24], "switch": [4, 5, 27, 32, 35, 39], "sy": 53, "sycl": 14, "sycl_runtim": [14, 28], "symbol": 40, "sync": 33, "system": [14, 21, 30, 31, 32, 34, 35, 38, 39, 40, 56], "t": [2, 5, 11, 13, 17, 18, 20, 28, 29, 31, 36, 49, 54, 56], "tab": 22, "tabl": [18, 28, 29, 30, 31, 49], "tag": 5, "take": [0, 11, 16, 24, 28, 29, 32, 34, 35, 38, 51], "tanh": [24, 25, 26], "tape": 28, "tar": [3, 7, 32, 49], "target": [3, 16, 17, 39, 40], "task": [11, 20, 32, 61], "task_nam": 16, "taskset": 29, "tbb": 42, "tdp": 31, "team": [7, 54], "techniqu": [15, 28], "technologi": [16, 45], "tee": [29, 37, 51, 62], "tell": 14, "templat": 11, "temporari": 13, "tensor": [11, 16, 25, 28, 30, 40, 53], "tensorboard": [22, 63], "tensorflow": [5, 8, 9, 10, 11, 13, 14, 15, 16, 17, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 38, 43, 44, 46, 47, 48, 50, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "tensorflow2": [51, 58, 60], "tensorflow2_keras_mnist": 58, "tensorflow_doc": 56, "tensorflow_hub": 22, "tensorflow_model_serv": [3, 34], "tensorflow_plugin": 34, "tensorflow_serv": [3, 34], "tensorflow_src": 40, "term": [0, 25, 30, 63], "termin": 38, "test": [9, 19, 22, 28, 34, 35, 38, 44, 55, 56], "test_accuraci": 28, "test_dataset": 28, "test_func": 28, "test_scor": [19, 28], "test_step": 28, "text": [18, 31, 44], "text2imag": [31, 44], "tf": [11, 14, 15, 19, 22, 25, 26, 27, 28, 29, 30, 33, 35, 37, 39, 40, 41, 42, 51, 52, 53, 62], "tf2": [49, 51, 56], "tf32": [20, 31, 51], "tf_auto_jit_flag": 27, "tf_auto_mixed_precision_graph_rewrite_allowlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_allowlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_clearlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_clearlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_denylist_add": 18, "tf_auto_mixed_precision_graph_rewrite_denylist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_inferlist_add": 18, "tf_auto_mixed_precision_graph_rewrite_inferlist_remov": 18, "tf_auto_mixed_precision_graph_rewrite_level": 18, "tf_auto_mixed_precision_graph_rewrite_log_path": 18, "tf_bert_finetune_": 51, "tf_bert_pretraining_lamb_": 51, "tf_check_ok": 40, "tf_code": 40, "tf_compatible_vers": 33, "tf_copt": [11, 34], "tf_cpp_max_vlog_level": 20, "tf_cpp_min_log_level": 20, "tf_cuda_librari": 34, "tf_enable_onednn_opt": 29, "tf_getcod": [11, 40], "tf_hub": 22, "tf_include_path": 40, "tf_kera": 27, "tf_loadpluggabledevicelibrari": 40, "tf_messag": 40, "tf_newopdefinitionbuild": 11, "tf_newstatu": [11, 40], "tf_num_interop_thread": 62, "tf_num_intraop_thread": 62, "tf_ok": [11, 40], "tf_opdefinitionbuild": 11, "tf_opdefinitionbuilderaddattr": 11, "tf_opdefinitionbuilderaddinput": 11, "tf_opdefinitionbuilderaddoutput": 11, "tf_opdefinitionbuildersetshapeinferencefunct": 11, "tf_registeropdefinit": 11, "tf_serv": 34, "tf_statu": 40, "tf_use_legacy_kera": [27, 51, 54], "tf_ver": 2, "tf_xla_auto_jit": [16, 27, 30], "tf_xla_flag": [16, 27, 30], "tf_xla_use_device_api": [16, 30], "tfa": [25, 26, 55], "tfcc_path": 40, "tfd": 61, "tfg": 17, "tfg_optimizer_hook": 62, "tfg_to_h": 17, "tfhub": 22, "tfrecord": [51, 55, 61], "tfx": 21, "than": [19, 25, 28, 32, 35, 37, 42, 47, 53, 58], "thei": [0, 18, 28, 29, 32], "them": [16, 18, 21, 28, 29, 32, 34, 56, 61], "therefor": [28, 32], "thereof": 16, "thi": [0, 2, 3, 4, 5, 11, 13, 14, 16, 17, 18, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 39, 40, 42, 45, 46, 49, 50, 51, 52, 53, 55, 57, 60, 62, 63], "thing": 21, "think": 28, "third": [9, 36, 63], "third_parti": [7, 9, 34], "those": [0, 16, 18, 19, 34, 61], "though": 39, "thrash": 32, "thread": [4, 13, 20, 29, 31, 32, 33, 42], "threadpool": [3, 20, 40], "threaten": 0, "three": [4, 21, 22, 23, 29], "through": [0, 27, 28, 32, 35, 39, 40, 55, 63], "throughput": [31, 47, 51, 54], "throughput_mod": 29, "throughput_train": 51, "thu": 32, "tiger_cat": 48, "tightli": 30, "tile": [17, 20, 33, 51, 58, 60, 61, 62], "time": [0, 4, 11, 14, 16, 18, 19, 20, 21, 22, 28, 31, 32, 35, 39, 40, 45, 49, 51], "timehistori": [61, 62], "tip": [11, 20, 32, 34], "tmp": 34, "todai": 30, "togeth": 32, "toggl": 33, "toi": 28, "token": [54, 56], "too": [18, 28, 37, 42], "tookit": [39, 40], "tool": [7, 9, 11, 14, 18, 32, 36, 37, 38, 39, 40, 42, 63], "toolchain": 39, "toolkit": [14, 31, 37, 38, 45, 47, 58, 63], "top": 27, "topic": 4, "topologi": [21, 29, 32], "total": [31, 32, 35, 49, 51, 58], "total_loss": 51, "total_tim": 35, "total_training_step": 51, "tour": 63, "tout": 24, "toward": 0, "tpl": 7, "tpost": 24, "tpu": 49, "trace": 22, "traceback": 56, "track": [22, 56], "train": [2, 14, 17, 18, 21, 24, 25, 26, 27, 29, 34, 35, 37, 38, 42, 43, 44, 47, 51, 52, 57, 59, 63], "train_accuraci": 62, "train_and_ev": 61, "train_batch_s": [57, 60], "train_batch_size_phase1": 51, "train_batch_size_phase2": 51, "train_dataset": 28, "train_epoch": 62, "train_fil": 57, "train_horovod": 58, "train_loss": [51, 62], "train_maskrcnn": [55, 60], "train_step": [28, 51, 62], "trainabl": [25, 35], "trainable_vari": 28, "trainer": 61, "trainingop": 24, "transfer": 52, "transform": [24, 25], "translat": [0, 39, 40], "transpar": [4, 21], "transpos": [24, 26], "travers": 36, "treat": 20, "tree": [39, 40], "tri": 56, "tricki": 28, "trigger": [5, 19, 33], "troll": 0, "true": [11, 16, 22, 25, 26, 28, 29, 30, 33, 35, 40, 51, 57, 62], "truncat": 34, "try": [11, 21, 29, 45, 49, 52], "ttt": 31, "tumor": 55, "tune": [31, 33, 45, 51], "tupl": 35, "turbo": 31, "turn": [17, 63], "tutori": 56, "two": [4, 13, 14, 19, 21, 23, 28, 32, 35, 39, 47, 51, 54, 55, 60], "txt": [16, 18, 37, 42, 54, 57, 62], "type": [4, 7, 11, 14, 18, 20, 21, 29, 31, 33, 38, 39, 40, 47, 49], "type_infer": 17, "typeconstraint": 11, "typeerror": 56, "typenam": 11, "typic": [4, 21, 23, 28, 32], "u": [0, 22, 29, 42], "ubuntu": [2, 31, 34, 39, 40, 41, 42], "ubuntu22": 56, "ubuntu_vers": 2, "uma": 32, "unaccept": 0, "uncased_l": 51, "unchanged_shape_fn": 11, "undef": 11, "undefin": [2, 30], "under": [17, 23, 26, 29, 33, 39, 52], "understand": 36, "undesir": 29, "unet": [31, 44], "unet_3d_med": 55, "unexpect": 51, "unifi": [21, 29, 37], "uniform": [4, 16, 21, 30, 35], "uniniti": 17, "uninstal": [11, 51, 60], "unit": [19, 25, 28, 32, 35], "unknown": [14, 28], "unkown": 27, "unless": 33, "unmodifi": 16, "unnecessari": [24, 28, 32], "unoptim": 36, "unordered_map": 11, "unprofession": 0, "unsafe_force_al": 18, "unscal": 28, "unshard": 17, "unsolicit": 0, "unspecifi": 29, "until": [18, 32], "unwelcom": 0, "unzip": 40, "up": [18, 22, 28, 32, 37, 40, 44, 51, 54, 57], "updat": [2, 18, 27, 28, 37, 38, 39, 40, 41, 42, 62], "update_st": 28, "upenn": 55, "upgrad": [14, 37, 38, 41, 42, 45, 46, 49, 55, 60, 63], "upon": 55, "upstream": [14, 18], "url": [49, 54, 56], "us": [0, 2, 3, 4, 5, 7, 13, 14, 15, 16, 18, 19, 20, 22, 23, 24, 25, 26, 28, 31, 32, 33, 36, 37, 38, 39, 40, 42, 44, 46, 47, 49, 50, 51, 52, 53, 55, 56, 57, 60, 63], "usag": [4, 14, 16, 21, 32, 33, 35, 44], "use_bia": [25, 26], "use_default_alloc": 29, "use_itex_shard": 62, "use_logical_cor": 29, "use_mytrain": 51, "use_synthetic_data": [60, 62], "use_tf_funct": 62, "use_tf_while_loop": 62, "use_tpu": 57, "use_xla": 51, "usecyclespersecondtim": [4, 21, 22, 28], "user": [4, 5, 7, 11, 13, 19, 20, 21, 23, 27, 30, 37, 39, 40, 41, 42, 43, 47, 54, 63], "usr": [7, 29, 37, 39], "usual": 18, "ut": 7, "util": [4, 9, 11, 14, 16, 21, 23, 29, 31, 32, 35, 56, 62], "v": [2, 3, 16, 18, 34, 38, 40, 42, 46, 47], "v0": [31, 33, 38], "v1": [35, 49, 51, 52, 57, 63], "v100": 51, "v1_8": [35, 47], "v2": [15, 31, 33, 38, 42, 49, 51, 61, 63], "v3": [15, 44], "v4": [18, 35, 44], "val_accuraci": 28, "val_loss": 28, "valid": [8, 33], "validation_split": [19, 28, 35], "valu": [15, 17, 18, 20, 25, 28, 29, 31, 32, 33, 61], "valueerror": 33, "var": [2, 14, 34, 38, 39, 40, 42], "vari": 27, "variabl": [2, 4, 13, 15, 16, 19, 21, 22, 23, 24, 25, 27, 28, 30, 32, 34, 35, 38, 40, 52], "variable_dtyp": 28, "varianc": 25, "varibl": 51, "varieti": 44, "variou": 16, "ve": [39, 40], "vector": 40, "venv": [46, 55, 58, 60], "verbos": [11, 19, 20, 28, 29, 30, 35], "veri": [15, 28, 51], "verifi": [38, 39, 40, 44, 51, 54, 55, 56, 57, 60, 61, 62], "version": [0, 2, 11, 14, 16, 27, 28, 31, 32, 37, 38, 39, 40, 41, 42, 45, 46, 51, 56], "versu": [19, 32], "via": [0, 4, 11, 17, 27, 30, 31, 35, 44, 62, 63], "view": 8, "viewer": 22, "viewpoint": 0, "violat": 0, "virtual": [39, 40, 51, 52, 54, 55, 56, 57, 60, 61, 62], "virtual_env": 29, "visibl": [0, 2, 11, 34], "vision": 30, "visit": 63, "vnni": 52, "vocab": [16, 57], "vocab_fil": [16, 57], "void": 11, "volum": 55, "vulner": 63, "vz": 40, "w": [28, 31, 35, 44], "wa": [0, 29, 32, 33, 39, 40], "wai": [0, 16, 19, 28, 30, 34, 36, 38], "wait": 32, "want": [3, 5, 7, 28, 29, 37, 39, 40, 42, 51, 54, 57, 60], "warm": [22, 35], "warmup": 35, "warmup_step": 55, "warmup_steps_phase1": 51, "warmup_steps_phase2": 51, "warn": [28, 29, 40, 51], "wd": [25, 31], "wd_black": 31, "we": [0, 2, 7, 11, 24, 27, 28, 31, 32, 33, 34, 35, 38, 39, 40, 45, 46, 47, 49, 51, 52, 54, 55, 56, 57, 60, 61, 63], "weak": 31, "web": [5, 56], "websit": [45, 63], "weight": [4, 13, 25, 28, 51, 53, 62], "weight_decai": [25, 26], "welcom": [0, 7, 63], "well": [0, 2, 8, 11, 21, 26, 28, 29, 30, 31, 32, 51], "were": [0, 16, 29, 32], "wether": 27, "wget": [2, 7, 32, 35, 37, 39, 40, 42, 47, 49, 56, 58], "what": [0, 14, 28], "wheel": [2, 38, 39], "when": [0, 5, 14, 17, 19, 24, 27, 28, 29, 32, 34, 35, 36, 37, 39, 40, 51, 52, 55, 56, 60], "where": [25, 28, 31, 32, 39, 49], "wherea": 61, "wherebi": 32, "whether": [24, 29, 32], "which": [0, 4, 7, 9, 13, 14, 15, 16, 17, 18, 19, 20, 24, 28, 29, 30, 32, 33, 35, 36, 37, 39, 40, 42, 45, 46, 52, 57], "while": [16, 21, 28, 31, 32, 33, 34, 39, 48, 53, 56], "whitespac": 51, "whitlei": 31, "whl": [2, 11, 39, 40, 63], "whole": [18, 20, 33, 51], "whole_seq_output": 25, "whose": 18, "why": 0, "wide": [14, 25, 36, 44], "wiki": 0, "wiki_onli": 51, "wikicorpus_en": 51, "wikipedia": [31, 32, 51], "wish": 39, "within": [0, 15, 25, 30, 37, 51], "without": [0, 4, 16, 18, 20, 21, 23, 28, 30, 31, 39, 40, 44, 52, 56, 63], "withsum": 24, "wl": 40, "wno": 34, "won": [5, 29, 36], "work": [1, 4, 7, 14, 15, 19, 20, 21, 27, 28, 29, 32, 35, 36, 40, 42, 45, 49, 52], "worker": 28, "workflow": 16, "workload": [2, 4, 16, 32, 35, 44, 52, 60, 63], "workspac": [2, 3, 34], "world": 28, "wors": 47, "would": [28, 37, 39, 61], "wrap": 28, "wrap_funct": 35, "wrapper": [28, 42], "write": [5, 7, 16, 19], "written": [0, 7, 27], "wrong": [39, 40], "ws1": 47, "wu": 25, "www": [0, 21, 42], "x": [11, 19, 25, 26, 28, 31, 39, 40, 47, 53, 58], "x15": 14, "x710": 31, "x86_64": [38, 39, 40], "x_test": [19, 28, 35], "x_train": [19, 28, 35], "xe": 31, "xeon": [4, 21, 31, 32, 35, 39, 40, 41, 44, 47], "xfd": 11, "xla": [4, 16, 27], "xla_global_id": 2, "xpu": [2, 4, 11, 14, 17, 19, 22, 25, 26, 28, 30, 33, 37, 38, 43, 45, 46, 47, 48, 49, 53, 54, 55, 58, 60], "xpu_force_sync": 33, "xpu_lib_path": 40, "xpuautoshard": [4, 33, 44], "xx": [34, 61], "xxx": [7, 52, 56], "xxxx": [58, 61], "xxxxx": [34, 51, 62], "xxxxxx": 11, "xxxxxxxx": 52, "xzf": 7, "xzvf": 32, "y": [11, 25, 26, 28, 35, 37, 39, 40, 47, 58, 63], "y_test": [19, 28, 35], "y_train": [19, 28, 35], "yaml": 61, "ye": [19, 38], "you": [2, 3, 4, 5, 7, 8, 11, 13, 14, 16, 17, 18, 20, 21, 22, 23, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 52, 53, 54, 55, 56, 57, 60, 61, 62], "your": [2, 3, 5, 7, 14, 27, 30, 32, 34, 35, 37, 38, 39, 40, 41, 42, 46, 47, 49, 51, 52, 54, 56, 62, 63], "your_script": 29, "your_script_arg": 29, "yourself": 29, "yuxin": 25, "yyi": 52, "yym": 58, "yyyi": 58, "z": [40, 58], "ze_api": 14, "ze_enable_tracing_lay": [4, 21, 22, 28], "zero": [14, 25, 26, 28, 37], "zip": 28, "zoo": 44, "zxvf": 49, "zzz": 7, "zzzz": 58}, "titles": ["Contributor Covenant Code of Conduct", "Security Policy", "Intel\u00ae Extension for TensorFlow* Docker Container Guide", "Intel\u00ae Extension for TensorFlow* Serving - Docker Container Guide", "Welcome to Intel\u00ae Extension for TensorFlow* documentation", "Online Documentation Build Guide", "Welcome to Intel \u00ae Extension for TensorFlow* documentation!", "Contributing guidelines", "Releases", "Directory Tree Structure", "Extension Design", "How to write custom op", "Optimizations Design", "oneDNN object cache optimization", "Frequently Asked Questions", "INT8 Quantization", "OpenXLA", "XPUAutoShard on GPU [Experimental]", "Tune Advanced Auto Mixed Precision", "Advanced Auto Mixed Precision", "Environment Variables", "Features", "GPU Profiler", "Infrastructure", "Graph fusion", "Customized Operators", "Operators Override", "Keras 3 Overview", "Keras Mixed Precision", "Launch Script User Guide", "NextPluggableDevice Overview", "Performance Data", "Practice Guide", "Python APIs", "Install TensorFlow Serving with Intel\u00ae Extension for TensorFlow*", "Selecting Thread Pool in Intel\u00ae Extension for TensorFlow* CPU [Experimental]", "Online Weight Prepack", "Experimental: Intel\u00ae Arc\u2122 A-Series GPU Software Installation", "Conda Environment Installation Instructions", "Overview", "Intel\u00ae Extension for TensorFlow* for C++", "Intel CPU Software Installation", "Intel XPU Software Installation", "Installation Guide", "Examples", "Accelerate AlexNet by Quantization with Intel\u00ae Extension for Tensorflow*", "Common Guide for Running", "Speed up Inference of Inception v4 by Advanced Automatic Mixed Precision on Intel CPU and GPU via Docker Container or Bare Metal", "ResNet50 Inference on Intel CPU and GPU", "Intel\u00ae Extension for Tensorflow* Model Quantization API Example", "Accelerate Deep Learning Training and Inference for Model Zoo Workloads on Intel GPU", "Accelerate BERT-Large Pretraining on Intel GPU", "Quantize Inception V3 by Intel\u00ae Extension for Tensorflow* on Intel\u00ae Xeon\u00ae", "Quick Example on Intel CPU and GPU", "Stable Diffusion Inference for Text2Image on Intel GPU", "Accelerate 3D-Unet Training w/o horovod for medical image segmentation on Intel GPU", "BERT Training for Classifying Text on Intel CPU and GPU", "FP8 BERT-Large Fine-tuning for Classifying Text on Intel GPU", "Distributed Training Example with Intel\u00ae Optimization for Horovod* on Intel\u00ae GPU", "Refer to train_resnet50", "Accelerate Mask R-CNN Training on Intel GPU", "Resnet50 train on Intel GPU", "Accelerate ResNet50 Training by XPUAutoShard on Intel GPU", "Intel\u00ae Extension for TensorFlow*", "Welcome to Intel \u00ae Extension for TensorFlow* documentation!"], "titleterms": {"1": [0, 11, 31, 34, 37, 40], "1550": 31, "17": 39, "170": 31, "1x": 31, "2": [0, 11, 34, 37, 40], "3": [0, 11, 27, 37], "3d": [31, 55], "4": [0, 11, 31, 37], "4x": 31, "5": 31, "6": 11, "7": 11, "8": 11, "9": 11, "A": 37, "By": 37, "For": [39, 40], "If": 61, "That": 2, "With": 62, "acceler": [45, 50, 51, 55, 60, 62], "access": [2, 32], "accuraci": [31, 54, 57], "activ": 26, "adamw": 26, "adamwithweightdecayoptim": 25, "add": 11, "addit": [31, 39], "advanc": [18, 19, 21, 23, 29, 47, 52], "ai": 31, "alexnet": 45, "all": 29, "alloc": [29, 32], "amp": [19, 21, 47], "api": [17, 18, 20, 21, 23, 33, 47, 48, 49, 54, 62], "appli": [49, 58, 61], "arc": 37, "architectur": [23, 30], "ask": 14, "attribut": [0, 18], "auto": [18, 19, 20, 21], "automat": 47, "automixedprecisionopt": 33, "b0": 31, "b3": 31, "backend": 20, "background": [18, 45, 52], "ban": 0, "bare": [41, 42, 47, 50], "base": [39, 40, 42, 45, 46], "basic": [24, 29], "bazel": [7, 39, 40], "bert": [31, 51, 56, 57], "bf16": 57, "binari": [2, 3, 63], "boost": 52, "build": [2, 3, 5, 11, 14, 28, 34, 39, 40, 41, 42], "c": [7, 34, 40], "cach": 13, "case": 27, "cc": 40, "center": 31, "chang": [8, 51, 54, 55, 57, 60, 61], "channel": 63, "check": [30, 42, 52, 58], "clang": 39, "classifi": [56, 57], "clone": [47, 58], "cnn": 60, "code": [0, 7, 17, 19, 39, 40, 51, 53, 54, 55, 56, 57, 58, 60, 61, 62], "command": [51, 58, 61, 62], "common": [29, 39, 40, 46], "compar": 47, "compat": 63, "compil": 39, "compressor": 49, "conda": [38, 39, 40], "conduct": 0, "config": [20, 33], "configproto": 33, "configur": [18, 20, 31, 32, 39, 40, 47, 52], "constant": 52, "contain": [2, 3, 41, 42, 47, 50], "content": 32, "contribut": [7, 63], "contributor": 0, "control": 29, "converg": 51, "convolut": 13, "core": 29, "correct": 0, "count": 58, "coven": 0, "cpu": [21, 32, 35, 39, 40, 41, 42, 47, 48, 52, 53, 54, 56, 61, 63], "creat": [5, 39, 40, 58], "current": 30, "custom": [2, 11, 19, 23, 25, 28], "data": [19, 24, 31], "dataset": [49, 51, 55, 60, 61], "debug": 7, "debugopt": 33, "deep": [50, 52], "default": 29, "defin": 11, "definit": 20, "dens": 26, "depend": 58, "deprec": 42, "descript": [2, 3], "design": [10, 12, 29], "detail": 24, "devcloud": [45, 52], "develop": 7, "devic": [30, 58], "differ": [18, 27, 28], "diffus": [31, 54], "directli": 37, "directori": 9, "disabl": 52, "distribut": 58, "docker": [2, 3, 34, 41, 42, 47, 50], "dockerfil": [34, 41, 42], "dockerhub": [41, 42], "document": [4, 5, 6, 7, 63, 64], "download": [39, 40, 47, 56, 58], "driver": [37, 39, 40, 42, 46], "dtype": 28, "dump": 17, "eas": 21, "effect": 36, "efficientnet": 31, "eigen": 35, "enabl": [19, 46, 47, 48, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "end": 18, "enforc": 0, "engin": 23, "environ": [18, 20, 29, 33, 37, 38, 39, 40, 41, 42, 45, 46, 47, 48, 49, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "error": 27, "exampl": [16, 17, 18, 19, 22, 29, 35, 39, 40, 44, 48, 49, 51, 53, 54, 55, 57, 58, 60, 61, 62], "execut": [29, 45, 47, 48, 51, 54, 55, 56, 57, 58, 60, 61, 62], "experiment": [17, 21, 35, 37], "extens": [2, 3, 4, 6, 7, 10, 23, 33, 34, 35, 37, 39, 40, 41, 42, 45, 49, 52, 63, 64], "extra": [39, 40], "extract": 40, "faq": [22, 47, 48, 51, 54, 55, 56, 57, 60], "featur": [19, 21, 23], "file": 40, "fine": 57, "finetun": 51, "fit": 28, "flex": 31, "fold": 52, "format": 32, "fp16": 54, "fp32": [47, 54], "fp8": 57, "frequent": 14, "from": [2, 14, 34, 40, 41, 42], "full": 37, "function": 52, "further": 62, "fusion": 24, "gelu": [25, 26], "gener": 24, "get": [41, 42], "get_config": 33, "gnu": 32, "gpu": [2, 17, 21, 22, 31, 32, 37, 39, 40, 42, 45, 46, 47, 48, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62], "gpuoption": 33, "graph": [17, 19, 21, 24, 33, 52], "graphopt": 33, "groupnorm": 25, "guid": [2, 3, 5, 7, 29, 32, 43, 46, 50], "guidelin": [0, 7], "hardwar": [28, 31, 32, 37, 39, 40, 41, 42, 45, 47, 51, 52, 54, 55, 56, 57, 60, 61, 62, 63], "header": 40, "highlight": 4, "horovod": [55, 58, 61], "how": [11, 16, 28], "hvd": 61, "i": [2, 3, 29], "identifi": 28, "ii": [2, 3, 29], "iii": [2, 29], "imag": [3, 31, 34, 55], "imagenet": 61, "implement": [11, 24], "import": 33, "improv": 18, "incept": [47, 52], "includ": 29, "incompat": 8, "index": 29, "infer": [29, 31, 47, 48, 50, 54], "infrastructur": 23, "instal": [11, 34, 37, 38, 39, 40, 41, 42, 43, 49, 53, 58, 62, 63], "instanc": [26, 29], "instruct": [37, 38], "int8": [15, 21], "integr": 40, "intel": [2, 3, 4, 6, 7, 23, 31, 32, 33, 34, 35, 37, 39, 40, 41, 42, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 61, 62, 63, 64], "intel_extension_for_tensorflow": 33, "interfac": 11, "introduct": [5, 13, 23, 45, 47, 50, 51, 52, 54, 55, 56, 57, 60, 61, 62], "issu": 8, "itex": [25, 33], "itex_verbos": 20, "itexlstm": 25, "iv": 29, "ix": 29, "jemalloc": 29, "jupyt": [52, 54, 56], "kera": [27, 28], "kernel": 11, "known": 8, "lamboptim": 25, "larg": [31, 51, 57], "latenc": 29, "latest": 5, "launch": 29, "launcher": 21, "layer": 26, "layernorm": 25, "layout": [24, 32], "lead": 27, "learn": [50, 52], "level": 20, "librari": [34, 40], "licens": [52, 63], "limit": 36, "linker": 40, "linux": 37, "list": 18, "load": 40, "local": [5, 45, 52], "log": [19, 29], "logic": 29, "loop": 28, "loss": 28, "lstm": 26, "manag": 23, "manual": 19, "mask": [31, 60], "matrix": 52, "max": 31, "medic": [31, 55], "memori": [29, 32], "metal": [41, 42, 47, 50], "method": 47, "mix": [18, 19, 20, 21, 24, 28, 47], "mobilenet": 18, "mode": 29, "model": [28, 31, 34, 47, 49, 50, 51, 54, 55, 57, 60, 61], "multi": [29, 55], "multipl": 29, "name": 33, "nativ": 37, "net": 31, "neural": 49, "nextpluggabledevic": 30, "node": [29, 31], "non": 32, "normal": 26, "note": 53, "notebook": [52, 54, 56], "notic": 19, "numa": [29, 32], "numactl": 32, "number": 29, "numer": 18, "o": 55, "object": [13, 16], "omp_num_thread": 32, "one": 29, "oneapi": [37, 39, 40, 42, 46, 58], "onednn": [13, 52], "onli": [39, 40, 42], "onlin": [5, 36], "op": [11, 25, 33], "openmp": [32, 35], "openxla": [16, 21, 30], "oper": [19, 21, 25, 26, 33], "optim": [12, 13, 19, 21, 24, 58], "option": [20, 37, 39, 40, 58], "origin": 19, "other": 62, "our": 0, "output": [48, 53, 54, 58, 61, 62], "overflow": 28, "overrid": [26, 33], "overview": [15, 16, 17, 19, 20, 27, 28, 29, 30, 31, 32, 33, 36, 39, 49], "packag": [11, 40, 42, 62], "paramet": [61, 62], "patch": [58, 61], "perform": [18, 27, 31, 47], "perman": 0, "phase2": 31, "physic": 29, "pjrt": 30, "platform": 42, "pledg": 0, "pluggabledevic": 30, "plugin": 30, "polici": [1, 28], "pool": 35, "practic": 32, "pre": 49, "precis": [18, 19, 20, 21, 28, 47], "precondit": 38, "prepack": 36, "prepar": [2, 3, 40, 44, 46, 47, 48, 49, 51, 54, 55, 56, 57, 58, 60, 61, 62], "prerequisit": [11, 33, 48, 51, 54, 55, 56, 57, 60, 61, 62], "preserv": 33, "pretrain": [47, 51], "product": 31, "profil": [21, 22], "protocol": [20, 33], "public": 23, "py": 53, "pypi": [37, 39, 41, 42], "python": [7, 11, 17, 18, 20, 21, 33, 40, 47, 48, 54, 62], "pythonpath": 62, "quantiz": [15, 21, 45, 49, 52], "question": 14, "quick": [19, 50, 53], "quick_exampl": 53, "r": 60, "rcnn": 31, "recommend": 40, "refer": [16, 36, 59], "regist": 11, "releas": [5, 8, 37], "repo": 58, "report": 1, "repositori": 47, "requir": [37, 39, 40, 41, 42, 47, 51, 54, 55, 56, 57, 60, 61, 62, 63], "resnet50": [48, 61, 62], "resnet50v1": 31, "resourc": [10, 63], "respons": 0, "result": [31, 47, 51], "rule": 18, "run": [2, 3, 34, 37, 40, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 55, 56, 57, 58, 60, 61, 62], "runtim": [14, 30], "sampl": 34, "save": 19, "scale": 28, "scope": 0, "script": [2, 29, 46], "secur": [1, 63], "segment": 55, "select": 35, "seri": 37, "serv": [3, 21, 34], "server": [34, 45, 52], "set": [28, 29, 45, 49, 61, 62], "set_config": 33, "setup": [19, 28, 37, 42, 46, 47, 48, 51, 54, 55, 56, 57, 58, 60, 61, 62], "shard": 62, "shardingconfig": 33, "singl": [29, 55], "situat": 27, "skip": [47, 48, 54, 56, 61], "softwar": [31, 32, 37, 41, 42, 49, 63], "sourc": [14, 34, 39, 40], "speed": 47, "stabil": 18, "stabl": [31, 54], "standard": 0, "start": [30, 50], "startup": [52, 56], "step": [37, 38, 47, 48, 54, 56, 61], "stock": [18, 19], "structur": [9, 17], "style": 7, "subsystem": 37, "support": [21, 63], "switch": 30, "system": [37, 41, 42], "tabl": [32, 63], "tcmalloc": [29, 32], "temporari": 0, "tensorflow": [2, 3, 4, 6, 7, 18, 19, 21, 23, 33, 34, 35, 37, 39, 40, 41, 42, 45, 49, 52, 63, 64], "test": [5, 7, 47], "text": [56, 57], "text2imag": 54, "tf_num_interop_thread": 29, "tf_num_intraop_thread": 29, "thi": [47, 48, 54, 56, 61], "thread": 35, "throughput": 29, "tile": 55, "tip": [7, 19], "toolkit": [39, 40, 42, 46], "train": [19, 28, 31, 49, 50, 55, 56, 58, 60, 61, 62], "train_resnet50": 59, "tree": 9, "troubleshoot": 14, "tune": [18, 19, 57], "type": [19, 24, 28, 30], "u": 31, "ubuntu": 37, "underflow": 28, "unet": 55, "uniform": 32, "unit": 7, "up": [45, 47, 49], "updat": 5, "us": [11, 21, 27, 29, 30, 34, 35, 61], "usag": [2, 15, 17, 18, 19, 22, 26, 29, 36], "user": 29, "v": [19, 29], "v1": 31, "v3": 52, "v4": 47, "variabl": [18, 20, 29, 33, 37, 42, 47], "vasriabl": 54, "verifi": [2, 11, 37, 41, 42], "version": [5, 33, 52], "vi": 29, "via": [20, 37, 41, 42, 47], "vii": 29, "viii": 29, "virtual": [37, 41, 42, 46, 58], "vulner": 1, "w": 55, "warn": [0, 27], "weekli": 63, "weight": 36, "welcom": [4, 6, 64], "wheel": [37, 41, 42], "why": 30, "window": 37, "without": [61, 62], "work": 16, "workflow": [10, 15, 17, 36], "workload": [31, 50], "write": 11, "wsl2": 37, "x": 29, "xeon": 52, "xla": 30, "xpu": [23, 39, 40, 42, 63], "xpuautoshard": [17, 21, 62], "your": 29, "zoo": 50}}) \ No newline at end of file